Update README.md
Browse files
README.md
CHANGED
|
@@ -30,7 +30,7 @@ wav_path = "test-mini-audios/3fe64f3d-282c-4bc8-a753-68f8f6c35652.wav" # from M
|
|
| 30 |
waveform, _ = torchaudio.load(wav_path) # 16KHz
|
| 31 |
audios = [waveform[0].numpy()]
|
| 32 |
|
| 33 |
-
# Make prompt
|
| 34 |
question = "Based on the given audio, identify the source of the speaking voice."
|
| 35 |
options = ["Man", "Woman", "Child", "Robot"]
|
| 36 |
prompt = f"{question} Please choose the answer from the following options: {str(options)}. Output the final answer in <answer> </answer>."
|
|
@@ -40,6 +40,7 @@ message = [
|
|
| 40 |
{"type": "text", "text": prompt}
|
| 41 |
]}
|
| 42 |
]
|
|
|
|
| 43 |
|
| 44 |
# Process
|
| 45 |
inputs = processor(text=texts, audios=audios, sampling_rate=16000, return_tensors="pt", padding=True).to(model.device)
|
|
|
|
| 30 |
waveform, _ = torchaudio.load(wav_path) # 16KHz
|
| 31 |
audios = [waveform[0].numpy()]
|
| 32 |
|
| 33 |
+
# Make prompt text
|
| 34 |
question = "Based on the given audio, identify the source of the speaking voice."
|
| 35 |
options = ["Man", "Woman", "Child", "Robot"]
|
| 36 |
prompt = f"{question} Please choose the answer from the following options: {str(options)}. Output the final answer in <answer> </answer>."
|
|
|
|
| 40 |
{"type": "text", "text": prompt}
|
| 41 |
]}
|
| 42 |
]
|
| 43 |
+
texts = processor.apply_chat_template(message, add_generation_prompt=True, tokenize=False)
|
| 44 |
|
| 45 |
# Process
|
| 46 |
inputs = processor(text=texts, audios=audios, sampling_rate=16000, return_tensors="pt", padding=True).to(model.device)
|