mrfakename committed on
Commit
27cee60
1 Parent(s): ea89faa

Sync from GitHub repo

Browse files

This Space is synced from the GitHub repo: https://github.com/SWivid/F5-TTS. Please submit contributions there.

pyproject.toml CHANGED
@@ -4,7 +4,7 @@ build-backend = "setuptools.build_meta"
4
 
5
  [project]
6
  name = "f5-tts"
7
- version = "0.2.0"
8
  description = "F5-TTS: A Fairytaler that Fakes Fluent and Faithful Speech with Flow Matching"
9
  readme = "README.md"
10
  license = {text = "MIT License"}
 
4
 
5
  [project]
6
  name = "f5-tts"
7
+ version = "0.2.1"
8
  description = "F5-TTS: A Fairytaler that Fakes Fluent and Faithful Speech with Flow Matching"
9
  readme = "README.md"
10
  license = {text = "MIT License"}
src/f5_tts/configs/E2TTS_Base_train.yaml CHANGED
@@ -33,8 +33,9 @@ model:
33
  win_length: 1024
34
  n_fft: 1024
35
  mel_spec_type: vocos # 'vocos' or 'bigvgan'
36
- is_local_vocoder: False # use local offline vocoder ckpt or not
37
- local_vocoder_path: None # path to local vocoder
 
38
 
39
  ckpts:
40
  logger: wandb # wandb | tensorboard | None
 
33
  win_length: 1024
34
  n_fft: 1024
35
  mel_spec_type: vocos # 'vocos' or 'bigvgan'
36
+ vocoder:
37
+ is_local: False # use local offline ckpt or not
38
+ local_path: None # local vocoder path
39
 
40
  ckpts:
41
  logger: wandb # wandb | tensorboard | None
src/f5_tts/configs/E2TTS_Small_train.yaml CHANGED
@@ -33,8 +33,9 @@ model:
33
  win_length: 1024
34
  n_fft: 1024
35
  mel_spec_type: vocos # 'vocos' or 'bigvgan'
36
- is_local_vocoder: False
37
- local_vocoder_path: None
 
38
 
39
  ckpts:
40
  logger: wandb # wandb | tensorboard | None
 
33
  win_length: 1024
34
  n_fft: 1024
35
  mel_spec_type: vocos # 'vocos' or 'bigvgan'
36
+ vocoder:
37
+ is_local: False # use local offline ckpt or not
38
+ local_path: None # local vocoder path
39
 
40
  ckpts:
41
  logger: wandb # wandb | tensorboard | None
src/f5_tts/configs/F5TTS_Base_train.yaml CHANGED
@@ -35,8 +35,9 @@ model:
35
  win_length: 1024
36
  n_fft: 1024
37
  mel_spec_type: vocos # 'vocos' or 'bigvgan'
38
- is_local_vocoder: False # use local offline vocoder ckpt or not
39
- local_vocoder_path: None # local vocoder path
 
40
 
41
  ckpts:
42
  logger: wandb # wandb | tensorboard | None
 
35
  win_length: 1024
36
  n_fft: 1024
37
  mel_spec_type: vocos # 'vocos' or 'bigvgan'
38
+ vocoder:
39
+ is_local: False # use local offline ckpt or not
40
+ local_path: None # local vocoder path
41
 
42
  ckpts:
43
  logger: wandb # wandb | tensorboard | None
src/f5_tts/configs/F5TTS_Small_train.yaml CHANGED
@@ -35,8 +35,9 @@ model:
35
  win_length: 1024
36
  n_fft: 1024
37
  mel_spec_type: vocos # 'vocos' or 'bigvgan'
38
- is_local_vocoder: False
39
- local_vocoder_path: None
 
40
 
41
  ckpts:
42
  logger: wandb # wandb | tensorboard | None
 
35
  win_length: 1024
36
  n_fft: 1024
37
  mel_spec_type: vocos # 'vocos' or 'bigvgan'
38
+ vocoder:
39
+ is_local: False # use local offline ckpt or not
40
+ local_path: None # local vocoder path
41
 
42
  ckpts:
43
  logger: wandb # wandb | tensorboard | None
src/f5_tts/train/train.py CHANGED
@@ -59,8 +59,8 @@ def main(cfg):
59
  log_samples=True,
60
  bnb_optimizer=cfg.optim.bnb_optimizer,
61
  mel_spec_type=mel_spec_type,
62
- is_local_vocoder=cfg.model.mel_spec.is_local_vocoder,
63
- local_vocoder_path=cfg.model.mel_spec.local_vocoder_path,
64
  )
65
 
66
  train_dataset = load_dataset(cfg.datasets.name, tokenizer, mel_spec_kwargs=cfg.model.mel_spec)
 
59
  log_samples=True,
60
  bnb_optimizer=cfg.optim.bnb_optimizer,
61
  mel_spec_type=mel_spec_type,
62
+ is_local_vocoder=cfg.model.vocoder.is_local,
63
+ local_vocoder_path=cfg.model.vocoder.local_path,
64
  )
65
 
66
  train_dataset = load_dataset(cfg.datasets.name, tokenizer, mel_spec_kwargs=cfg.model.mel_spec)