Update README.md
Browse files
README.md
CHANGED
|
@@ -13,4 +13,39 @@ datasets:
|
|
| 13 |
- espnet/yodas
|
| 14 |
---
|
| 15 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 16 |
Original repo: https://github.com/SWivid/F5-TTS
|
|
|
|
| 13 |
- espnet/yodas
|
| 14 |
---
|
| 15 |
|
| 16 |
+
## How to use (example)
|
| 17 |
+
|
| 18 |
+
```python
|
| 19 |
+
!pip install git+https://github.com/SWivid/F5-TTS.git
|
| 20 |
+
|
| 21 |
+
|
| 22 |
+
model_id = "TVI/f5-tts-ru-accent"
|
| 23 |
+
download_dir = "ckpts"  # Replace with any local directory; if you do, update ckpt_file and vocab_file below to point to it
|
| 24 |
+
|
| 25 |
+
!huggingface-cli download {model_id} --local-dir {download_dir}
|
| 26 |
+
|
| 27 |
+
|
| 28 |
+
model = "F5TTS_v1_Base"
|
| 29 |
+
ckpt_file = "/content/ckpts/model_last.safetensors"
|
| 30 |
+
vocab_file = "/content/ckpts/vocab.txt"
|
| 31 |
+
ref_audio = "PATH_TO_REF"
|
| 32 |
+
ref_text = "REFERENCE TRANSCRIPT"  # transcript of the reference audio, or "" to leave it empty
|
| 33 |
+
gen_text = "YOUR TEXT"
|
| 34 |
+
wav_output_dir = "OUTPUT_FOLDER"
|
| 35 |
+
wav_output_filename = "OUTPUT_FILE.wav"
|
| 36 |
+
speed = 1.0
|
| 37 |
+
|
| 38 |
+
command = (
|
| 39 |
+
f'f5-tts_infer-cli --model {model} --ckpt_file "{ckpt_file}" '
|
| 40 |
+
f'--vocab_file "{vocab_file}" -r "{ref_audio}" -s "{ref_text}" '
|
| 41 |
+
f'-t "{gen_text}" -o "{wav_output_dir}" -w "{wav_output_filename}" '
|
| 42 |
+
f'--speed {speed} --remove_silence'
|
| 43 |
+
)
|
| 44 |
+
|
| 45 |
+
print(command)
|
| 46 |
+
|
| 47 |
+
!{command}
|
| 48 |
+
|
| 49 |
+
```
|
| 50 |
+
|
| 51 |
Original repo: https://github.com/SWivid/F5-TTS
|