Update README.md
Browse files
README.md
CHANGED
@@ -13,4 +13,39 @@ datasets:
|
|
13 |
- espnet/yodas
|
14 |
---
|
15 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
16 |
Original repo: https://github.com/SWivid/F5-TTS
|
|
|
13 |
- espnet/yodas
|
14 |
---
|
15 |
|
16 |
+
## How to use (example)
|
17 |
+
|
18 |
+
```python
|
19 |
+
!pip install git+https://github.com/SWivid/F5-TTS.git
|
20 |
+
|
21 |
+
|
22 |
+
model_id = "TVI/f5-tts-ru-accent"
|
23 |
+
download_dir = "ckpts"  # Replace with any local directory; ckpt_file and vocab_file below must point to files inside it
|
24 |
+
|
25 |
+
!huggingface-cli download {model_id} --local-dir {download_dir}
|
26 |
+
|
27 |
+
|
28 |
+
model = "F5TTS_v1_Base"
|
29 |
+
ckpt_file = "/content/ckpts/model_last.safetensors"
|
30 |
+
vocab_file = "/content/ckpts/vocab.txt"
|
31 |
+
ref_audio = "PATH_TO_REF"
|
32 |
+
ref_text = "REF TRANSCRIPT or EMPTY"
|
33 |
+
gen_text = "YOUR TEXT"
|
34 |
+
wav_output_dir = "OUTPUT_FOLDER"
|
35 |
+
wav_output_filename = "OUTPUT_FILE.wav"
|
36 |
+
speed = 1.0
|
37 |
+
|
38 |
+
command = (
|
39 |
+
f'f5-tts_infer-cli --model {model} --ckpt_file "{ckpt_file}" '
|
40 |
+
f'--vocab_file "{vocab_file}" -r "{ref_audio}" -s "{ref_text}" '
|
41 |
+
f'-t "{gen_text}" -o "{wav_output_dir}" -w "{wav_output_filename}" '
|
42 |
+
f'--speed {speed} --remove_silence'
|
43 |
+
)
|
44 |
+
|
45 |
+
print(command)
|
46 |
+
|
47 |
+
!{command}
|
48 |
+
|
49 |
+
```
|
50 |
+
|
51 |
Original repo: https://github.com/SWivid/F5-TTS
|