Spaces:
Running
on
Zero
Running
on
Zero
mrfakename
committed on
Commit
•
27cee60
1
Parent(s):
ea89faa
Sync from GitHub repo
Browse files
This Space is synced from the GitHub repo: https://github.com/SWivid/F5-TTS. Please submit contributions to the Space there.
pyproject.toml
CHANGED
@@ -4,7 +4,7 @@ build-backend = "setuptools.build_meta"
|
|
4 |
|
5 |
[project]
|
6 |
name = "f5-tts"
|
7 |
-
version = "0.2.
|
8 |
description = "F5-TTS: A Fairytaler that Fakes Fluent and Faithful Speech with Flow Matching"
|
9 |
readme = "README.md"
|
10 |
license = {text = "MIT License"}
|
|
|
4 |
|
5 |
[project]
|
6 |
name = "f5-tts"
|
7 |
+
version = "0.2.1"
|
8 |
description = "F5-TTS: A Fairytaler that Fakes Fluent and Faithful Speech with Flow Matching"
|
9 |
readme = "README.md"
|
10 |
license = {text = "MIT License"}
|
src/f5_tts/configs/E2TTS_Base_train.yaml
CHANGED
@@ -33,8 +33,9 @@ model:
|
|
33 |
win_length: 1024
|
34 |
n_fft: 1024
|
35 |
mel_spec_type: vocos # 'vocos' or 'bigvgan'
|
36 |
-
|
37 |
-
|
|
|
38 |
|
39 |
ckpts:
|
40 |
logger: wandb # wandb | tensorboard | None
|
|
|
33 |
win_length: 1024
|
34 |
n_fft: 1024
|
35 |
mel_spec_type: vocos # 'vocos' or 'bigvgan'
|
36 |
+
vocoder:
|
37 |
+
is_local: False # use local offline ckpt or not
|
38 |
+
local_path: None # local vocoder path
|
39 |
|
40 |
ckpts:
|
41 |
logger: wandb # wandb | tensorboard | None
|
src/f5_tts/configs/E2TTS_Small_train.yaml
CHANGED
@@ -33,8 +33,9 @@ model:
|
|
33 |
win_length: 1024
|
34 |
n_fft: 1024
|
35 |
mel_spec_type: vocos # 'vocos' or 'bigvgan'
|
36 |
-
|
37 |
-
|
|
|
38 |
|
39 |
ckpts:
|
40 |
logger: wandb # wandb | tensorboard | None
|
|
|
33 |
win_length: 1024
|
34 |
n_fft: 1024
|
35 |
mel_spec_type: vocos # 'vocos' or 'bigvgan'
|
36 |
+
vocoder:
|
37 |
+
is_local: False # use local offline ckpt or not
|
38 |
+
local_path: None # local vocoder path
|
39 |
|
40 |
ckpts:
|
41 |
logger: wandb # wandb | tensorboard | None
|
src/f5_tts/configs/F5TTS_Base_train.yaml
CHANGED
@@ -35,8 +35,9 @@ model:
|
|
35 |
win_length: 1024
|
36 |
n_fft: 1024
|
37 |
mel_spec_type: vocos # 'vocos' or 'bigvgan'
|
38 |
-
|
39 |
-
|
|
|
40 |
|
41 |
ckpts:
|
42 |
logger: wandb # wandb | tensorboard | None
|
|
|
35 |
win_length: 1024
|
36 |
n_fft: 1024
|
37 |
mel_spec_type: vocos # 'vocos' or 'bigvgan'
|
38 |
+
vocoder:
|
39 |
+
is_local: False # use local offline ckpt or not
|
40 |
+
local_path: None # local vocoder path
|
41 |
|
42 |
ckpts:
|
43 |
logger: wandb # wandb | tensorboard | None
|
src/f5_tts/configs/F5TTS_Small_train.yaml
CHANGED
@@ -35,8 +35,9 @@ model:
|
|
35 |
win_length: 1024
|
36 |
n_fft: 1024
|
37 |
mel_spec_type: vocos # 'vocos' or 'bigvgan'
|
38 |
-
|
39 |
-
|
|
|
40 |
|
41 |
ckpts:
|
42 |
logger: wandb # wandb | tensorboard | None
|
|
|
35 |
win_length: 1024
|
36 |
n_fft: 1024
|
37 |
mel_spec_type: vocos # 'vocos' or 'bigvgan'
|
38 |
+
vocoder:
|
39 |
+
is_local: False # use local offline ckpt or not
|
40 |
+
local_path: None # local vocoder path
|
41 |
|
42 |
ckpts:
|
43 |
logger: wandb # wandb | tensorboard | None
|
src/f5_tts/train/train.py
CHANGED
@@ -59,8 +59,8 @@ def main(cfg):
|
|
59 |
log_samples=True,
|
60 |
bnb_optimizer=cfg.optim.bnb_optimizer,
|
61 |
mel_spec_type=mel_spec_type,
|
62 |
-
is_local_vocoder=cfg.model.
|
63 |
-
local_vocoder_path=cfg.model.
|
64 |
)
|
65 |
|
66 |
train_dataset = load_dataset(cfg.datasets.name, tokenizer, mel_spec_kwargs=cfg.model.mel_spec)
|
|
|
59 |
log_samples=True,
|
60 |
bnb_optimizer=cfg.optim.bnb_optimizer,
|
61 |
mel_spec_type=mel_spec_type,
|
62 |
+
is_local_vocoder=cfg.model.vocoder.is_local,
|
63 |
+
local_vocoder_path=cfg.model.vocoder.local_path,
|
64 |
)
|
65 |
|
66 |
train_dataset = load_dataset(cfg.datasets.name, tokenizer, mel_spec_kwargs=cfg.model.mel_spec)
|