Update prompt for decoding

This commit is contained in:
Yuekai Zhang 2024-06-07 10:57:35 +08:00
parent 40e4ac480c
commit 16f18080be

View File

@ -280,10 +280,14 @@ def decode_one_batch(
feature_len = feature_len.to(device, dtype=dtype)
messages = [[
{"role": "system", "content": "你是一个能处理音频的助手。"},
{"role": "user", "content": f"请转写音频为文字 {DEFAULT_SPEECH_TOKEN}"},
{"role": "user", "content": f"{DEFAULT_SPEECH_TOKEN}请转写音频为文字"},
{"role": "assistant", "content": ""},
]] * len(feature)
# messages = [[
# {"role": "system", "content": "你是一个能处理音频的助手。"},
# {"role": "user", "content": f"请转写音频为文字 {DEFAULT_SPEECH_TOKEN}"},
# {"role": "assistant", "content": ""},
# ]] * len(feature)
input_ids, attention_mask = preprocess(
messages, tokenizer, max_len=128