Sync from GitHub repo
Browse files
This Space is synced from the GitHub repo: https://github.com/SWivid/F5-TTS. Please submit contributions to the Space there.
pyproject.toml
CHANGED
|
@@ -4,7 +4,7 @@ build-backend = "setuptools.build_meta"
|
|
| 4 |
|
| 5 |
[project]
|
| 6 |
name = "f5-tts"
|
| 7 |
-
version = "0.2.
|
| 8 |
description = "F5-TTS: A Fairytaler that Fakes Fluent and Faithful Speech with Flow Matching"
|
| 9 |
readme = "README.md"
|
| 10 |
license = {text = "MIT License"}
|
|
|
|
| 4 |
|
| 5 |
[project]
|
| 6 |
name = "f5-tts"
|
| 7 |
+
version = "0.2.1"
|
| 8 |
description = "F5-TTS: A Fairytaler that Fakes Fluent and Faithful Speech with Flow Matching"
|
| 9 |
readme = "README.md"
|
| 10 |
license = {text = "MIT License"}
|
src/f5_tts/configs/E2TTS_Base_train.yaml
CHANGED
|
@@ -33,8 +33,9 @@ model:
|
|
| 33 |
win_length: 1024
|
| 34 |
n_fft: 1024
|
| 35 |
mel_spec_type: vocos # 'vocos' or 'bigvgan'
|
| 36 |
-
|
| 37 |
-
|
|
|
|
| 38 |
|
| 39 |
ckpts:
|
| 40 |
logger: wandb # wandb | tensorboard | None
|
|
|
|
| 33 |
win_length: 1024
|
| 34 |
n_fft: 1024
|
| 35 |
mel_spec_type: vocos # 'vocos' or 'bigvgan'
|
| 36 |
+
vocoder:
|
| 37 |
+
is_local: False # use local offline ckpt or not
|
| 38 |
+
local_path: None # local vocoder path
|
| 39 |
|
| 40 |
ckpts:
|
| 41 |
logger: wandb # wandb | tensorboard | None
|
src/f5_tts/configs/E2TTS_Small_train.yaml
CHANGED
|
@@ -33,8 +33,9 @@ model:
|
|
| 33 |
win_length: 1024
|
| 34 |
n_fft: 1024
|
| 35 |
mel_spec_type: vocos # 'vocos' or 'bigvgan'
|
| 36 |
-
|
| 37 |
-
|
|
|
|
| 38 |
|
| 39 |
ckpts:
|
| 40 |
logger: wandb # wandb | tensorboard | None
|
|
|
|
| 33 |
win_length: 1024
|
| 34 |
n_fft: 1024
|
| 35 |
mel_spec_type: vocos # 'vocos' or 'bigvgan'
|
| 36 |
+
vocoder:
|
| 37 |
+
is_local: False # use local offline ckpt or not
|
| 38 |
+
local_path: None # local vocoder path
|
| 39 |
|
| 40 |
ckpts:
|
| 41 |
logger: wandb # wandb | tensorboard | None
|
src/f5_tts/configs/F5TTS_Base_train.yaml
CHANGED
|
@@ -35,8 +35,9 @@ model:
|
|
| 35 |
win_length: 1024
|
| 36 |
n_fft: 1024
|
| 37 |
mel_spec_type: vocos # 'vocos' or 'bigvgan'
|
| 38 |
-
|
| 39 |
-
|
|
|
|
| 40 |
|
| 41 |
ckpts:
|
| 42 |
logger: wandb # wandb | tensorboard | None
|
|
|
|
| 35 |
win_length: 1024
|
| 36 |
n_fft: 1024
|
| 37 |
mel_spec_type: vocos # 'vocos' or 'bigvgan'
|
| 38 |
+
vocoder:
|
| 39 |
+
is_local: False # use local offline ckpt or not
|
| 40 |
+
local_path: None # local vocoder path
|
| 41 |
|
| 42 |
ckpts:
|
| 43 |
logger: wandb # wandb | tensorboard | None
|
src/f5_tts/configs/F5TTS_Small_train.yaml
CHANGED
|
@@ -35,8 +35,9 @@ model:
|
|
| 35 |
win_length: 1024
|
| 36 |
n_fft: 1024
|
| 37 |
mel_spec_type: vocos # 'vocos' or 'bigvgan'
|
| 38 |
-
|
| 39 |
-
|
|
|
|
| 40 |
|
| 41 |
ckpts:
|
| 42 |
logger: wandb # wandb | tensorboard | None
|
|
|
|
| 35 |
win_length: 1024
|
| 36 |
n_fft: 1024
|
| 37 |
mel_spec_type: vocos # 'vocos' or 'bigvgan'
|
| 38 |
+
vocoder:
|
| 39 |
+
is_local: False # use local offline ckpt or not
|
| 40 |
+
local_path: None # local vocoder path
|
| 41 |
|
| 42 |
ckpts:
|
| 43 |
logger: wandb # wandb | tensorboard | None
|
src/f5_tts/train/train.py
CHANGED
|
@@ -59,8 +59,8 @@ def main(cfg):
|
|
| 59 |
log_samples=True,
|
| 60 |
bnb_optimizer=cfg.optim.bnb_optimizer,
|
| 61 |
mel_spec_type=mel_spec_type,
|
| 62 |
-
is_local_vocoder=cfg.model.
|
| 63 |
-
local_vocoder_path=cfg.model.
|
| 64 |
)
|
| 65 |
|
| 66 |
train_dataset = load_dataset(cfg.datasets.name, tokenizer, mel_spec_kwargs=cfg.model.mel_spec)
|
|
|
|
| 59 |
log_samples=True,
|
| 60 |
bnb_optimizer=cfg.optim.bnb_optimizer,
|
| 61 |
mel_spec_type=mel_spec_type,
|
| 62 |
+
is_local_vocoder=cfg.model.vocoder.is_local,
|
| 63 |
+
local_vocoder_path=cfg.model.vocoder.local_path,
|
| 64 |
)
|
| 65 |
|
| 66 |
train_dataset = load_dataset(cfg.datasets.name, tokenizer, mel_spec_kwargs=cfg.model.mel_spec)
|