start
Browse files- .hydra/config.yaml +131 -0
- .hydra/hydra.yaml +182 -0
- .hydra/overrides.yaml +1 -0
- checkpoints/last.ckpt +3 -0
- config_tree.log +145 -0
- data/train.txt +0 -0
- data/valid.txt +24 -0
- tags.log +1 -0
- tensorboard/version_0/events.out.tfevents.1729448606.b9cbd4f2ed3e.1163.0 +3 -0
- tensorboard/version_0/hparams.yaml +117 -0
- train.log +13 -0
.hydra/config.yaml
ADDED
@@ -0,0 +1,131 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
task_name: train
|
2 |
+
run_name: anna
|
3 |
+
tags:
|
4 |
+
- nabucasa
|
5 |
+
- hungarian
|
6 |
+
- anna
|
7 |
+
train: true
|
8 |
+
test: true
|
9 |
+
ckpt_path: null
|
10 |
+
seed: 1234
|
11 |
+
data:
|
12 |
+
_target_: matcha.data.text_mel_datamodule.TextMelDataModule
|
13 |
+
name: nabucasa_anna
|
14 |
+
train_filelist_path: data/nabucasa_anna/train.txt
|
15 |
+
valid_filelist_path: data/nabucasa_anna/valid.txt
|
16 |
+
batch_size: 32
|
17 |
+
num_workers: 20
|
18 |
+
pin_memory: true
|
19 |
+
cleaners:
|
20 |
+
- hungarian_cleaners
|
21 |
+
add_blank: true
|
22 |
+
n_spks: 1
|
23 |
+
n_fft: 1024
|
24 |
+
n_feats: 80
|
25 |
+
sample_rate: 22050
|
26 |
+
hop_length: 256
|
27 |
+
win_length: 1024
|
28 |
+
f_min: 0
|
29 |
+
f_max: 8000
|
30 |
+
data_statistics:
|
31 |
+
mel_mean: -6.346419334411621
|
32 |
+
mel_std: 2.677656650543213
|
33 |
+
seed: ${seed}
|
34 |
+
load_durations: false
|
35 |
+
model:
|
36 |
+
_target_: matcha.models.matcha_tts.MatchaTTS
|
37 |
+
n_vocab: 178
|
38 |
+
n_spks: ${data.n_spks}
|
39 |
+
spk_emb_dim: 64
|
40 |
+
n_feats: 80
|
41 |
+
data_statistics: ${data.data_statistics}
|
42 |
+
out_size: null
|
43 |
+
prior_loss: true
|
44 |
+
use_precomputed_durations: ${data.load_durations}
|
45 |
+
encoder:
|
46 |
+
encoder_type: RoPE Encoder
|
47 |
+
encoder_params:
|
48 |
+
n_feats: ${model.n_feats}
|
49 |
+
n_channels: 192
|
50 |
+
filter_channels: 768
|
51 |
+
filter_channels_dp: 256
|
52 |
+
n_heads: 2
|
53 |
+
n_layers: 6
|
54 |
+
kernel_size: 3
|
55 |
+
p_dropout: 0.1
|
56 |
+
spk_emb_dim: 64
|
57 |
+
n_spks: 1
|
58 |
+
prenet: true
|
59 |
+
duration_predictor_params:
|
60 |
+
filter_channels_dp: ${model.encoder.encoder_params.filter_channels_dp}
|
61 |
+
kernel_size: 3
|
62 |
+
p_dropout: ${model.encoder.encoder_params.p_dropout}
|
63 |
+
decoder:
|
64 |
+
channels:
|
65 |
+
- 256
|
66 |
+
- 256
|
67 |
+
dropout: 0.05
|
68 |
+
attention_head_dim: 64
|
69 |
+
n_blocks: 1
|
70 |
+
num_mid_blocks: 2
|
71 |
+
num_heads: 2
|
72 |
+
act_fn: snakebeta
|
73 |
+
cfm:
|
74 |
+
name: CFM
|
75 |
+
solver: euler
|
76 |
+
sigma_min: 0.0001
|
77 |
+
optimizer:
|
78 |
+
_target_: torch.optim.Adam
|
79 |
+
_partial_: true
|
80 |
+
lr: 0.0001
|
81 |
+
weight_decay: 0.0
|
82 |
+
callbacks:
|
83 |
+
model_checkpoint:
|
84 |
+
_target_: lightning.pytorch.callbacks.ModelCheckpoint
|
85 |
+
dirpath: ${paths.output_dir}/checkpoints
|
86 |
+
filename: checkpoint_{epoch:03d}
|
87 |
+
monitor: epoch
|
88 |
+
verbose: false
|
89 |
+
save_last: true
|
90 |
+
save_top_k: 10
|
91 |
+
mode: max
|
92 |
+
auto_insert_metric_name: true
|
93 |
+
save_weights_only: false
|
94 |
+
every_n_train_steps: null
|
95 |
+
train_time_interval: null
|
96 |
+
every_n_epochs: 100
|
97 |
+
save_on_train_epoch_end: null
|
98 |
+
model_summary:
|
99 |
+
_target_: lightning.pytorch.callbacks.RichModelSummary
|
100 |
+
max_depth: 3
|
101 |
+
rich_progress_bar:
|
102 |
+
_target_: lightning.pytorch.callbacks.RichProgressBar
|
103 |
+
logger:
|
104 |
+
tensorboard:
|
105 |
+
_target_: lightning.pytorch.loggers.tensorboard.TensorBoardLogger
|
106 |
+
save_dir: ${paths.output_dir}/tensorboard/
|
107 |
+
name: null
|
108 |
+
log_graph: false
|
109 |
+
default_hp_metric: true
|
110 |
+
prefix: ''
|
111 |
+
trainer:
|
112 |
+
_target_: lightning.pytorch.trainer.Trainer
|
113 |
+
default_root_dir: ${paths.output_dir}
|
114 |
+
max_epochs: -1
|
115 |
+
accelerator: gpu
|
116 |
+
devices:
|
117 |
+
- 0
|
118 |
+
precision: 16-mixed
|
119 |
+
check_val_every_n_epoch: 1
|
120 |
+
deterministic: false
|
121 |
+
gradient_clip_val: 5.0
|
122 |
+
paths:
|
123 |
+
root_dir: ${oc.env:PROJECT_ROOT}
|
124 |
+
data_dir: ${paths.root_dir}/data/
|
125 |
+
log_dir: ${paths.root_dir}/logs/
|
126 |
+
output_dir: ${hydra:runtime.output_dir}
|
127 |
+
work_dir: ${hydra:runtime.cwd}
|
128 |
+
extras:
|
129 |
+
ignore_warnings: false
|
130 |
+
enforce_tags: true
|
131 |
+
print_config: true
|
.hydra/hydra.yaml
ADDED
@@ -0,0 +1,182 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
hydra:
|
2 |
+
run:
|
3 |
+
dir: ${paths.log_dir}/${task_name}/${run_name}/runs/${now:%Y-%m-%d}_${now:%H-%M-%S}
|
4 |
+
sweep:
|
5 |
+
dir: ${paths.log_dir}/${task_name}/${run_name}/multiruns/${now:%Y-%m-%d}_${now:%H-%M-%S}
|
6 |
+
subdir: ${hydra.job.num}
|
7 |
+
launcher:
|
8 |
+
_target_: hydra._internal.core_plugins.basic_launcher.BasicLauncher
|
9 |
+
sweeper:
|
10 |
+
_target_: hydra._internal.core_plugins.basic_sweeper.BasicSweeper
|
11 |
+
max_batch_size: null
|
12 |
+
params: null
|
13 |
+
help:
|
14 |
+
app_name: ${hydra.job.name}
|
15 |
+
header: '${hydra.help.app_name} is powered by Hydra.
|
16 |
+
|
17 |
+
'
|
18 |
+
footer: 'Powered by Hydra (https://hydra.cc)
|
19 |
+
|
20 |
+
Use --hydra-help to view Hydra specific help
|
21 |
+
|
22 |
+
'
|
23 |
+
template: '${hydra.help.header}
|
24 |
+
|
25 |
+
== Configuration groups ==
|
26 |
+
|
27 |
+
Compose your configuration from those groups (group=option)
|
28 |
+
|
29 |
+
|
30 |
+
$APP_CONFIG_GROUPS
|
31 |
+
|
32 |
+
|
33 |
+
== Config ==
|
34 |
+
|
35 |
+
Override anything in the config (foo.bar=value)
|
36 |
+
|
37 |
+
|
38 |
+
$CONFIG
|
39 |
+
|
40 |
+
|
41 |
+
${hydra.help.footer}
|
42 |
+
|
43 |
+
'
|
44 |
+
hydra_help:
|
45 |
+
template: 'Hydra (${hydra.runtime.version})
|
46 |
+
|
47 |
+
See https://hydra.cc for more info.
|
48 |
+
|
49 |
+
|
50 |
+
== Flags ==
|
51 |
+
|
52 |
+
$FLAGS_HELP
|
53 |
+
|
54 |
+
|
55 |
+
== Configuration groups ==
|
56 |
+
|
57 |
+
Compose your configuration from those groups (For example, append hydra/job_logging=disabled
|
58 |
+
to command line)
|
59 |
+
|
60 |
+
|
61 |
+
$HYDRA_CONFIG_GROUPS
|
62 |
+
|
63 |
+
|
64 |
+
Use ''--cfg hydra'' to Show the Hydra config.
|
65 |
+
|
66 |
+
'
|
67 |
+
hydra_help: ???
|
68 |
+
hydra_logging:
|
69 |
+
version: 1
|
70 |
+
formatters:
|
71 |
+
colorlog:
|
72 |
+
(): colorlog.ColoredFormatter
|
73 |
+
format: '[%(cyan)s%(asctime)s%(reset)s][%(purple)sHYDRA%(reset)s] %(message)s'
|
74 |
+
handlers:
|
75 |
+
console:
|
76 |
+
class: logging.StreamHandler
|
77 |
+
formatter: colorlog
|
78 |
+
stream: ext://sys.stdout
|
79 |
+
root:
|
80 |
+
level: INFO
|
81 |
+
handlers:
|
82 |
+
- console
|
83 |
+
disable_existing_loggers: false
|
84 |
+
job_logging:
|
85 |
+
version: 1
|
86 |
+
formatters:
|
87 |
+
simple:
|
88 |
+
format: '[%(asctime)s][%(name)s][%(levelname)s] - %(message)s'
|
89 |
+
colorlog:
|
90 |
+
(): colorlog.ColoredFormatter
|
91 |
+
format: '[%(cyan)s%(asctime)s%(reset)s][%(blue)s%(name)s%(reset)s][%(log_color)s%(levelname)s%(reset)s]
|
92 |
+
- %(message)s'
|
93 |
+
log_colors:
|
94 |
+
DEBUG: purple
|
95 |
+
INFO: green
|
96 |
+
WARNING: yellow
|
97 |
+
ERROR: red
|
98 |
+
CRITICAL: red
|
99 |
+
handlers:
|
100 |
+
console:
|
101 |
+
class: logging.StreamHandler
|
102 |
+
formatter: colorlog
|
103 |
+
stream: ext://sys.stdout
|
104 |
+
file:
|
105 |
+
class: logging.FileHandler
|
106 |
+
formatter: simple
|
107 |
+
filename: ${hydra.runtime.output_dir}/${hydra.job.name}.log
|
108 |
+
root:
|
109 |
+
level: INFO
|
110 |
+
handlers:
|
111 |
+
- console
|
112 |
+
- file
|
113 |
+
disable_existing_loggers: false
|
114 |
+
env: {}
|
115 |
+
mode: RUN
|
116 |
+
searchpath: []
|
117 |
+
callbacks: {}
|
118 |
+
output_subdir: .hydra
|
119 |
+
overrides:
|
120 |
+
hydra:
|
121 |
+
- hydra.mode=RUN
|
122 |
+
task:
|
123 |
+
- experiment=anna
|
124 |
+
job:
|
125 |
+
name: train
|
126 |
+
chdir: null
|
127 |
+
override_dirname: experiment=anna
|
128 |
+
id: ???
|
129 |
+
num: ???
|
130 |
+
config_name: train.yaml
|
131 |
+
env_set: {}
|
132 |
+
env_copy: []
|
133 |
+
config:
|
134 |
+
override_dirname:
|
135 |
+
kv_sep: '='
|
136 |
+
item_sep: ','
|
137 |
+
exclude_keys: []
|
138 |
+
runtime:
|
139 |
+
version: 1.3.2
|
140 |
+
version_base: '1.3'
|
141 |
+
cwd: /workspace/Matcha-TTS
|
142 |
+
config_sources:
|
143 |
+
- path: hydra.conf
|
144 |
+
schema: pkg
|
145 |
+
provider: hydra
|
146 |
+
- path: /workspace/Matcha-TTS/configs
|
147 |
+
schema: file
|
148 |
+
provider: main
|
149 |
+
- path: hydra_plugins.hydra_colorlog.conf
|
150 |
+
schema: pkg
|
151 |
+
provider: hydra-colorlog
|
152 |
+
- path: ''
|
153 |
+
schema: structured
|
154 |
+
provider: schema
|
155 |
+
output_dir: /workspace/Matcha-TTS/logs/train/anna/runs/2024-10-20_18-23-24
|
156 |
+
choices:
|
157 |
+
debug: null
|
158 |
+
local: default
|
159 |
+
hparams_search: null
|
160 |
+
experiment: anna
|
161 |
+
hydra: default
|
162 |
+
extras: default
|
163 |
+
paths: default
|
164 |
+
trainer: default
|
165 |
+
logger: tensorboard
|
166 |
+
callbacks: default
|
167 |
+
model: matcha
|
168 |
+
model/optimizer: adam.yaml
|
169 |
+
model/cfm: default.yaml
|
170 |
+
model/decoder: default.yaml
|
171 |
+
model/encoder: default.yaml
|
172 |
+
data: nabucasa_anna.yaml
|
173 |
+
hydra/env: default
|
174 |
+
hydra/callbacks: null
|
175 |
+
hydra/job_logging: colorlog
|
176 |
+
hydra/hydra_logging: colorlog
|
177 |
+
hydra/hydra_help: default
|
178 |
+
hydra/help: default
|
179 |
+
hydra/sweeper: basic
|
180 |
+
hydra/launcher: basic
|
181 |
+
hydra/output: default
|
182 |
+
verbose: false
|
.hydra/overrides.yaml
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
- experiment=anna
|
checkpoints/last.ckpt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:18235b00378cd8de238238006c26697df650cc36d581b2f47eebd603476876c8
|
3 |
+
size 218838731
|
config_tree.log
ADDED
@@ -0,0 +1,145 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
CONFIG
|
2 |
+
├── data
|
3 |
+
│ └── _target_: matcha.data.text_mel_datamodule.TextMelDataModule
|
4 |
+
│ name: nabucasa_anna
|
5 |
+
│ train_filelist_path: data/nabucasa_anna/train.txt
|
6 |
+
│ valid_filelist_path: data/nabucasa_anna/valid.txt
|
7 |
+
│ batch_size: 32
|
8 |
+
│ num_workers: 20
|
9 |
+
│ pin_memory: true
|
10 |
+
│ cleaners:
|
11 |
+
│ - hungarian_cleaners
|
12 |
+
│ add_blank: true
|
13 |
+
│ n_spks: 1
|
14 |
+
│ n_fft: 1024
|
15 |
+
│ n_feats: 80
|
16 |
+
│ sample_rate: 22050
|
17 |
+
│ hop_length: 256
|
18 |
+
│ win_length: 1024
|
19 |
+
│ f_min: 0
|
20 |
+
│ f_max: 8000
|
21 |
+
│ data_statistics:
|
22 |
+
│ mel_mean: -6.346419334411621
|
23 |
+
│ mel_std: 2.677656650543213
|
24 |
+
│ seed: 1234
|
25 |
+
│ load_durations: false
|
26 |
+
│
|
27 |
+
├── model
|
28 |
+
│ └── _target_: matcha.models.matcha_tts.MatchaTTS
|
29 |
+
│ n_vocab: 178
|
30 |
+
│ n_spks: 1
|
31 |
+
│ spk_emb_dim: 64
|
32 |
+
│ n_feats: 80
|
33 |
+
│ data_statistics:
|
34 |
+
│ mel_mean: -6.346419334411621
|
35 |
+
│ mel_std: 2.677656650543213
|
36 |
+
│ out_size: null
|
37 |
+
│ prior_loss: true
|
38 |
+
│ use_precomputed_durations: false
|
39 |
+
│ encoder:
|
40 |
+
│ encoder_type: RoPE Encoder
|
41 |
+
│ encoder_params:
|
42 |
+
│ n_feats: 80
|
43 |
+
│ n_channels: 192
|
44 |
+
│ filter_channels: 768
|
45 |
+
│ filter_channels_dp: 256
|
46 |
+
│ n_heads: 2
|
47 |
+
│ n_layers: 6
|
48 |
+
│ kernel_size: 3
|
49 |
+
│ p_dropout: 0.1
|
50 |
+
│ spk_emb_dim: 64
|
51 |
+
│ n_spks: 1
|
52 |
+
│ prenet: true
|
53 |
+
│ duration_predictor_params:
|
54 |
+
│ filter_channels_dp: 256
|
55 |
+
│ kernel_size: 3
|
56 |
+
│ p_dropout: 0.1
|
57 |
+
│ decoder:
|
58 |
+
│ channels:
|
59 |
+
│ - 256
|
60 |
+
│ - 256
|
61 |
+
│ dropout: 0.05
|
62 |
+
│ attention_head_dim: 64
|
63 |
+
│ n_blocks: 1
|
64 |
+
│ num_mid_blocks: 2
|
65 |
+
│ num_heads: 2
|
66 |
+
│ act_fn: snakebeta
|
67 |
+
│ cfm:
|
68 |
+
│ name: CFM
|
69 |
+
│ solver: euler
|
70 |
+
│ sigma_min: 0.0001
|
71 |
+
│ optimizer:
|
72 |
+
│ _target_: torch.optim.Adam
|
73 |
+
│ _partial_: true
|
74 |
+
│ lr: 0.0001
|
75 |
+
│ weight_decay: 0.0
|
76 |
+
│
|
77 |
+
├── callbacks
|
78 |
+
│ └── model_checkpoint:
|
79 |
+
│ _target_: lightning.pytorch.callbacks.ModelCheckpoint
|
80 |
+
│ dirpath: /workspace/Matcha-TTS/logs/train/anna/runs/2024-10-20_18-23-2
|
81 |
+
│ filename: checkpoint_{epoch:03d}
|
82 |
+
│ monitor: epoch
|
83 |
+
│ verbose: false
|
84 |
+
│ save_last: true
|
85 |
+
│ save_top_k: 10
|
86 |
+
│ mode: max
|
87 |
+
│ auto_insert_metric_name: true
|
88 |
+
│ save_weights_only: false
|
89 |
+
│ every_n_train_steps: null
|
90 |
+
│ train_time_interval: null
|
91 |
+
│ every_n_epochs: 100
|
92 |
+
│ save_on_train_epoch_end: null
|
93 |
+
│ model_summary:
|
94 |
+
│ _target_: lightning.pytorch.callbacks.RichModelSummary
|
95 |
+
│ max_depth: 3
|
96 |
+
│ rich_progress_bar:
|
97 |
+
│ _target_: lightning.pytorch.callbacks.RichProgressBar
|
98 |
+
│
|
99 |
+
├── logger
|
100 |
+
│ └── tensorboard:
|
101 |
+
│ _target_: lightning.pytorch.loggers.tensorboard.TensorBoardLogger
|
102 |
+
│ save_dir: /workspace/Matcha-TTS/logs/train/anna/runs/2024-10-20_18-23-
|
103 |
+
│ name: null
|
104 |
+
│ log_graph: false
|
105 |
+
│ default_hp_metric: true
|
106 |
+
│ prefix: ''
|
107 |
+
│
|
108 |
+
├── trainer
|
109 |
+
│ └── _target_: lightning.pytorch.trainer.Trainer
|
110 |
+
│ default_root_dir: /workspace/Matcha-TTS/logs/train/anna/runs/2024-10-20_
|
111 |
+
│ max_epochs: -1
|
112 |
+
│ accelerator: gpu
|
113 |
+
│ devices:
|
114 |
+
│ - 0
|
115 |
+
│ precision: 16-mixed
|
116 |
+
│ check_val_every_n_epoch: 1
|
117 |
+
│ deterministic: false
|
118 |
+
│ gradient_clip_val: 5.0
|
119 |
+
│
|
120 |
+
├── paths
|
121 |
+
│ └── root_dir: /workspace/Matcha-TTS
|
122 |
+
│ data_dir: /workspace/Matcha-TTS/data/
|
123 |
+
│ log_dir: /workspace/Matcha-TTS/logs/
|
124 |
+
│ output_dir: /workspace/Matcha-TTS/logs/train/anna/runs/2024-10-20_18-23-
|
125 |
+
│ work_dir: /workspace/Matcha-TTS
|
126 |
+
│
|
127 |
+
├── extras
|
128 |
+
│ └── ignore_warnings: false
|
129 |
+
│ enforce_tags: true
|
130 |
+
│ print_config: true
|
131 |
+
│
|
132 |
+
├── task_name
|
133 |
+
│ └── train
|
134 |
+
├── run_name
|
135 |
+
│ └── anna
|
136 |
+
├── tags
|
137 |
+
│ └── ['nabucasa', 'hungarian', 'anna']
|
138 |
+
├── train
|
139 |
+
│ └── True
|
140 |
+
├── test
|
141 |
+
│ └── True
|
142 |
+
├── ckpt_path
|
143 |
+
│ └── None
|
144 |
+
└── seed
|
145 |
+
└── 1234
|
data/train.txt
ADDED
The diff for this file is too large to render.
See raw diff
|
|
data/valid.txt
ADDED
@@ -0,0 +1,24 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
data/nabucasa_anna/0000000001.wav|A színes manikűrök a fesztiválidőszakra tökéletesek lesznek, hiszen feltűnőek és izgalmasak, de abszolút elfogadható kereteken belül.
|
2 |
+
data/nabucasa_anna/0000000029.wav|Két tojás volt a sok salátalevél között, csak az vette észre, aki kifejezetten az én kajámat figyelte.
|
3 |
+
data/nabucasa_anna/0000000074.wav|Így amennyiben az átlagosnál nem csapadékosabb a tavasz és a nyárelő, komoly mezőgazdasági károk alakulhatnak ki, ahogy idén is.
|
4 |
+
data/nabucasa_anna/0000000179.wav|A kanapé az egyik legporosabb tárgy az otthonodban.
|
5 |
+
data/nabucasa_anna/0000000196.wav|Nem semmi történetet osztott meg egy vendég a neten.
|
6 |
+
data/nabucasa_anna/0100000004.wav|Egyéni célokat tűzött maga elé?
|
7 |
+
data/nabucasa_anna/0100000016.wav|De hát akkor ki írta?
|
8 |
+
data/nabucasa_anna/0100000081.wav|Jó, akkor mikor hívjon?
|
9 |
+
data/nabucasa_anna/0100000094.wav|Csapatban vagy egyedül érdemes futni?
|
10 |
+
data/nabucasa_anna/0200000003.wav|Ilyenkor konkrétan felismerhetetlenné válnak a számunkra amúgy jól ismert tárgyak!
|
11 |
+
data/nabucasa_anna/0200000066.wav|Szerencsés csillagzat alatt születtél, de nem csak ez az oka a sorozatos mázliknak!
|
12 |
+
data/nabucasa_anna/0300000046.wav|Melyik szóra gondoltál, hűtő mint H Ű T Ő vagy fűtő mint F Ű T Ő?
|
13 |
+
data/nabucasa_anna/3000000002.wav|Szia, ez nagyon jól hangzik, én is mehetek?
|
14 |
+
data/nabucasa_anna/3000000030.wav|Imádom a sivatagokat, ezért utazom ebbe az országba.
|
15 |
+
data/nabucasa_anna/3000000031.wav|A sivatagi táj lélegzetelállító, nekünk is el kellene menni.
|
16 |
+
data/nabucasa_anna/3000000037.wav|Spontán módon jobban szeretek utazni.
|
17 |
+
data/nabucasa_anna/3000000039.wav|Igen, holnap ötkor találkozunk a mozi előtt.
|
18 |
+
data/nabucasa_anna/3000000144.wav|Igen, szeretném tudni, hol voltál.
|
19 |
+
data/nabucasa_anna/3000000153.wav|Nekem is meg kell tanítanod ezt.
|
20 |
+
data/nabucasa_anna/3000000219.wav|Akkor megcsinálom, és kifizetem.
|
21 |
+
data/nabucasa_anna/3000000294.wav|Nagyon sajnálom, de pénzre van szükségem.
|
22 |
+
data/nabucasa_anna/4000000179.wav|Ön jogosult meghosszabbítani a garanciát további ötezer forint ellenében, kérjük nyilatkozzon a szándékáról.
|
23 |
+
data/nabucasa_anna/4000000189.wav|Ügyfeleink számára a lehető legjobb és könnyen adaptálható szolgáltatásra törekszünk.
|
24 |
+
data/nabucasa_anna/4000000236.wav|Az informatikus kolléga holnap tudja elhárítani a problémát, mert a készülék jelenleg nincs raktáron.
|
tags.log
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
['nabucasa', 'hungarian', 'anna']
|
tensorboard/version_0/events.out.tfevents.1729448606.b9cbd4f2ed3e.1163.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ada84686dc195843ebdb55b2d2d145f2928434c49a590869e8deb9460ec6e110
|
3 |
+
size 1468747
|
tensorboard/version_0/hparams.yaml
ADDED
@@ -0,0 +1,117 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
model:
|
2 |
+
_target_: matcha.models.matcha_tts.MatchaTTS
|
3 |
+
n_vocab: 178
|
4 |
+
n_spks: ${data.n_spks}
|
5 |
+
spk_emb_dim: 64
|
6 |
+
n_feats: 80
|
7 |
+
data_statistics: ${data.data_statistics}
|
8 |
+
out_size: null
|
9 |
+
prior_loss: true
|
10 |
+
use_precomputed_durations: ${data.load_durations}
|
11 |
+
encoder:
|
12 |
+
encoder_type: RoPE Encoder
|
13 |
+
encoder_params:
|
14 |
+
n_feats: ${model.n_feats}
|
15 |
+
n_channels: 192
|
16 |
+
filter_channels: 768
|
17 |
+
filter_channels_dp: 256
|
18 |
+
n_heads: 2
|
19 |
+
n_layers: 6
|
20 |
+
kernel_size: 3
|
21 |
+
p_dropout: 0.1
|
22 |
+
spk_emb_dim: 64
|
23 |
+
n_spks: 1
|
24 |
+
prenet: true
|
25 |
+
duration_predictor_params:
|
26 |
+
filter_channels_dp: ${model.encoder.encoder_params.filter_channels_dp}
|
27 |
+
kernel_size: 3
|
28 |
+
p_dropout: ${model.encoder.encoder_params.p_dropout}
|
29 |
+
decoder:
|
30 |
+
channels:
|
31 |
+
- 256
|
32 |
+
- 256
|
33 |
+
dropout: 0.05
|
34 |
+
attention_head_dim: 64
|
35 |
+
n_blocks: 1
|
36 |
+
num_mid_blocks: 2
|
37 |
+
num_heads: 2
|
38 |
+
act_fn: snakebeta
|
39 |
+
cfm:
|
40 |
+
name: CFM
|
41 |
+
solver: euler
|
42 |
+
sigma_min: 0.0001
|
43 |
+
optimizer:
|
44 |
+
_target_: torch.optim.Adam
|
45 |
+
_partial_: true
|
46 |
+
lr: 0.0001
|
47 |
+
weight_decay: 0.0
|
48 |
+
model/params/total: 18204193
|
49 |
+
model/params/trainable: 18204193
|
50 |
+
model/params/non_trainable: 0
|
51 |
+
data:
|
52 |
+
_target_: matcha.data.text_mel_datamodule.TextMelDataModule
|
53 |
+
name: nabucasa_anna
|
54 |
+
train_filelist_path: data/nabucasa_anna/train.txt
|
55 |
+
valid_filelist_path: data/nabucasa_anna/valid.txt
|
56 |
+
batch_size: 32
|
57 |
+
num_workers: 20
|
58 |
+
pin_memory: true
|
59 |
+
cleaners:
|
60 |
+
- hungarian_cleaners
|
61 |
+
add_blank: true
|
62 |
+
n_spks: 1
|
63 |
+
n_fft: 1024
|
64 |
+
n_feats: 80
|
65 |
+
sample_rate: 22050
|
66 |
+
hop_length: 256
|
67 |
+
win_length: 1024
|
68 |
+
f_min: 0
|
69 |
+
f_max: 8000
|
70 |
+
data_statistics:
|
71 |
+
mel_mean: -6.346419334411621
|
72 |
+
mel_std: 2.677656650543213
|
73 |
+
seed: ${seed}
|
74 |
+
load_durations: false
|
75 |
+
trainer:
|
76 |
+
_target_: lightning.pytorch.trainer.Trainer
|
77 |
+
default_root_dir: ${paths.output_dir}
|
78 |
+
max_epochs: -1
|
79 |
+
accelerator: gpu
|
80 |
+
devices:
|
81 |
+
- 0
|
82 |
+
precision: 16-mixed
|
83 |
+
check_val_every_n_epoch: 1
|
84 |
+
deterministic: false
|
85 |
+
gradient_clip_val: 5.0
|
86 |
+
callbacks:
|
87 |
+
model_checkpoint:
|
88 |
+
_target_: lightning.pytorch.callbacks.ModelCheckpoint
|
89 |
+
dirpath: ${paths.output_dir}/checkpoints
|
90 |
+
filename: checkpoint_{epoch:03d}
|
91 |
+
monitor: epoch
|
92 |
+
verbose: false
|
93 |
+
save_last: true
|
94 |
+
save_top_k: 10
|
95 |
+
mode: max
|
96 |
+
auto_insert_metric_name: true
|
97 |
+
save_weights_only: false
|
98 |
+
every_n_train_steps: null
|
99 |
+
train_time_interval: null
|
100 |
+
every_n_epochs: 100
|
101 |
+
save_on_train_epoch_end: null
|
102 |
+
model_summary:
|
103 |
+
_target_: lightning.pytorch.callbacks.RichModelSummary
|
104 |
+
max_depth: 3
|
105 |
+
rich_progress_bar:
|
106 |
+
_target_: lightning.pytorch.callbacks.RichProgressBar
|
107 |
+
extras:
|
108 |
+
ignore_warnings: false
|
109 |
+
enforce_tags: true
|
110 |
+
print_config: true
|
111 |
+
task_name: train
|
112 |
+
tags:
|
113 |
+
- nabucasa
|
114 |
+
- hungarian
|
115 |
+
- anna
|
116 |
+
ckpt_path: null
|
117 |
+
seed: 1234
|
train.log
ADDED
@@ -0,0 +1,13 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
[2024-10-20 18:23:24,847][matcha.utils.utils][INFO] - Enforcing tags! <cfg.extras.enforce_tags=True>
|
2 |
+
[2024-10-20 18:23:24,853][matcha.utils.utils][INFO] - Printing config tree with Rich! <cfg.extras.print_config=True>
|
3 |
+
[2024-10-20 18:23:24,925][__main__][INFO] - Instantiating datamodule <matcha.data.text_mel_datamodule.TextMelDataModule>
|
4 |
+
[2024-10-20 18:23:25,425][__main__][INFO] - Instantiating model <matcha.models.matcha_tts.MatchaTTS>
|
5 |
+
[2024-10-20 18:23:26,071][__main__][INFO] - Instantiating callbacks...
|
6 |
+
[2024-10-20 18:23:26,071][matcha.utils.instantiators][INFO] - Instantiating callback <lightning.pytorch.callbacks.ModelCheckpoint>
|
7 |
+
[2024-10-20 18:23:26,075][matcha.utils.instantiators][INFO] - Instantiating callback <lightning.pytorch.callbacks.RichModelSummary>
|
8 |
+
[2024-10-20 18:23:26,076][matcha.utils.instantiators][INFO] - Instantiating callback <lightning.pytorch.callbacks.RichProgressBar>
|
9 |
+
[2024-10-20 18:23:26,077][__main__][INFO] - Instantiating loggers...
|
10 |
+
[2024-10-20 18:23:26,077][matcha.utils.instantiators][INFO] - Instantiating logger <lightning.pytorch.loggers.tensorboard.TensorBoardLogger>
|
11 |
+
[2024-10-20 18:23:26,082][__main__][INFO] - Instantiating trainer <lightning.pytorch.trainer.Trainer>
|
12 |
+
[2024-10-20 18:23:26,123][__main__][INFO] - Logging hyperparameters!
|
13 |
+
[2024-10-20 18:23:26,188][__main__][INFO] - Starting training!
|