Nyanmero committed on
Commit
2238638
·
verified ·
1 Parent(s): 4199b1b

Training in progress, step 5000, checkpoint

Browse files
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a07ff07864099795f0ef4d933d28ad9679ab08369382487621535abb56f31408
3
  size 577859976
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ac561155f14c161be89688cbd6791c190ab41f1ce825521ecbfa6d19d6a0c5dc
3
  size 577859976
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fa549d0c6d2379df26a07b7c3966ffb132bd6ae13022a5b02c772d9255bfb476
3
  size 1155913545
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:101e64149047c3d744fdcb436b5dba2ca98b22115ce1eff72b44b64343dda473
3
  size 1155913545
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2d49f728245aa60e4fc9c5baaee9c0ba88b2cadcc8481faf5625d828b7dcb728
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2b87c169cee0ea524ed1c27bb8054d01ebdc65124a471acea18a35e7102d6ec2
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d73d3175aefaa69aadf2bfd7a28a272f3f909699b9e8910d2a5b7143d3350e78
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:860361ada6eb369eac489bd111b66d88a5634713630c0b874711d0b984bd4e88
3
  size 1064
last-checkpoint/spm_char.model CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ae27ad61041da617aec8ffe1c20890111b46b4a3cbb00984dac63f733f1004b9
3
  size 238738
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b531f1de35ab0170af3d23ae8a6e847481a4d0a40cde9036ea8160d511bf6b16
3
  size 238738
last-checkpoint/trainer_state.json CHANGED
@@ -1,169 +1,66 @@
1
  {
2
- "best_metric": 0.4254090189933777,
3
- "best_model_checkpoint": "./speecht5-tts-vie\\checkpoint-10000",
4
- "epoch": 20.408163265306122,
5
  "eval_steps": 1000,
6
- "global_step": 10000,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
- "epoch": 2.0408163265306123,
13
- "grad_norm": 1.8910266160964966,
14
- "learning_rate": 8.316666666666668e-06,
15
- "loss": 0.7092,
 
16
  "step": 1000
17
  },
18
  {
19
- "epoch": 2.0408163265306123,
20
- "eval_loss": 0.5270479917526245,
21
- "eval_runtime": 389.8964,
22
- "eval_samples_per_second": 17.212,
23
- "eval_steps_per_second": 0.539,
24
- "step": 1000
25
- },
26
- {
27
- "epoch": 4.081632653061225,
28
- "grad_norm": 1.5691834688186646,
29
- "learning_rate": 1.665e-05,
30
- "loss": 0.5566,
31
- "step": 2000
32
- },
33
- {
34
- "epoch": 4.081632653061225,
35
- "eval_loss": 0.48652538657188416,
36
- "eval_runtime": 379.2783,
37
- "eval_samples_per_second": 17.694,
38
- "eval_steps_per_second": 0.554,
39
  "step": 2000
40
  },
41
  {
42
- "epoch": 6.122448979591836,
43
- "grad_norm": 4.319777488708496,
44
- "learning_rate": 2.4983333333333335e-05,
45
- "loss": 0.5055,
46
- "step": 3000
47
- },
48
- {
49
- "epoch": 6.122448979591836,
50
- "eval_loss": 0.4476528465747833,
51
- "eval_runtime": 376.1339,
52
- "eval_samples_per_second": 17.842,
53
- "eval_steps_per_second": 0.558,
54
  "step": 3000
55
  },
56
  {
57
- "epoch": 8.16326530612245,
58
- "grad_norm": 3.316411256790161,
59
- "learning_rate": 3.3316666666666666e-05,
60
- "loss": 0.4789,
61
- "step": 4000
62
- },
63
- {
64
- "epoch": 8.16326530612245,
65
- "eval_loss": 0.4305626153945923,
66
- "eval_runtime": 379.5072,
67
- "eval_samples_per_second": 17.683,
68
- "eval_steps_per_second": 0.553,
69
  "step": 4000
70
  },
71
  {
72
- "epoch": 10.204081632653061,
73
- "grad_norm": 2.388119697570801,
74
  "learning_rate": 4.1641666666666665e-05,
75
- "loss": 0.4636,
76
  "step": 5000
77
  },
78
  {
79
- "epoch": 10.204081632653061,
80
- "eval_loss": 0.42910683155059814,
81
- "eval_runtime": 403.7863,
82
- "eval_samples_per_second": 16.62,
83
- "eval_steps_per_second": 0.52,
84
  "step": 5000
85
- },
86
- {
87
- "epoch": 12.244897959183673,
88
- "grad_norm": 1.92360520362854,
89
- "learning_rate": 4.9975e-05,
90
- "loss": 0.4555,
91
- "step": 6000
92
- },
93
- {
94
- "epoch": 12.244897959183673,
95
- "eval_loss": 0.42244505882263184,
96
- "eval_runtime": 379.3426,
97
- "eval_samples_per_second": 17.691,
98
- "eval_steps_per_second": 0.554,
99
- "step": 6000
100
- },
101
- {
102
- "epoch": 14.285714285714286,
103
- "grad_norm": 2.303443670272827,
104
- "learning_rate": 5.83e-05,
105
- "loss": 0.4471,
106
- "step": 7000
107
- },
108
- {
109
- "epoch": 14.285714285714286,
110
- "eval_loss": 0.4228420555591583,
111
- "eval_runtime": 470.6545,
112
- "eval_samples_per_second": 14.259,
113
- "eval_steps_per_second": 0.446,
114
- "step": 7000
115
- },
116
- {
117
- "epoch": 16.3265306122449,
118
- "grad_norm": 1.5780209302902222,
119
- "learning_rate": 6.663333333333333e-05,
120
- "loss": 0.4421,
121
- "step": 8000
122
- },
123
- {
124
- "epoch": 16.3265306122449,
125
- "eval_loss": 0.42195653915405273,
126
- "eval_runtime": 458.745,
127
- "eval_samples_per_second": 14.629,
128
- "eval_steps_per_second": 0.458,
129
- "step": 8000
130
- },
131
- {
132
- "epoch": 18.367346938775512,
133
- "grad_norm": 2.230262041091919,
134
- "learning_rate": 7.495e-05,
135
- "loss": 0.438,
136
- "step": 9000
137
- },
138
- {
139
- "epoch": 18.367346938775512,
140
- "eval_loss": 0.4210755228996277,
141
- "eval_runtime": 449.0465,
142
- "eval_samples_per_second": 14.945,
143
- "eval_steps_per_second": 0.468,
144
- "step": 9000
145
- },
146
- {
147
- "epoch": 20.408163265306122,
148
- "grad_norm": 2.0010855197906494,
149
- "learning_rate": 8.328333333333333e-05,
150
- "loss": 0.4375,
151
- "step": 10000
152
- },
153
- {
154
- "epoch": 20.408163265306122,
155
- "eval_loss": 0.4254090189933777,
156
- "eval_runtime": 433.4203,
157
- "eval_samples_per_second": 15.484,
158
- "eval_steps_per_second": 0.485,
159
- "step": 10000
160
  }
161
  ],
162
- "logging_steps": 1000,
163
  "max_steps": 100000,
164
  "num_input_tokens_seen": 0,
165
- "num_train_epochs": 205,
166
- "save_steps": 10000,
167
  "stateful_callbacks": {
168
  "TrainerControl": {
169
  "args": {
@@ -176,8 +73,8 @@
176
  "attributes": {}
177
  }
178
  },
179
- "total_flos": 3.444146373783773e+16,
180
- "train_batch_size": 32,
181
  "trial_name": null,
182
  "trial_params": null
183
  }
 
1
  {
2
+ "best_metric": 0.436745822429657,
3
+ "best_model_checkpoint": "./speecht5-tts-vie\\checkpoint-5000",
4
+ "epoch": 2.7487630566245187,
5
  "eval_steps": 1000,
6
+ "global_step": 5000,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
+ "epoch": 0.5497526113249038,
13
+ "eval_loss": 0.5397089123725891,
14
+ "eval_runtime": 246.0666,
15
+ "eval_samples_per_second": 50.669,
16
+ "eval_steps_per_second": 3.17,
17
  "step": 1000
18
  },
19
  {
20
+ "epoch": 1.0995052226498077,
21
+ "eval_loss": 0.5124471187591553,
22
+ "eval_runtime": 233.1296,
23
+ "eval_samples_per_second": 53.481,
24
+ "eval_steps_per_second": 3.346,
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
25
  "step": 2000
26
  },
27
  {
28
+ "epoch": 1.6492578339747115,
29
+ "eval_loss": 0.4633851647377014,
30
+ "eval_runtime": 232.6741,
31
+ "eval_samples_per_second": 53.586,
32
+ "eval_steps_per_second": 3.352,
 
 
 
 
 
 
 
33
  "step": 3000
34
  },
35
  {
36
+ "epoch": 2.1990104452996153,
37
+ "eval_loss": 0.4454704225063324,
38
+ "eval_runtime": 233.2342,
39
+ "eval_samples_per_second": 53.457,
40
+ "eval_steps_per_second": 3.344,
 
 
 
 
 
 
 
41
  "step": 4000
42
  },
43
  {
44
+ "epoch": 2.7487630566245187,
45
+ "grad_norm": 3.8025379180908203,
46
  "learning_rate": 4.1641666666666665e-05,
47
+ "loss": 0.5624,
48
  "step": 5000
49
  },
50
  {
51
+ "epoch": 2.7487630566245187,
52
+ "eval_loss": 0.436745822429657,
53
+ "eval_runtime": 231.6026,
54
+ "eval_samples_per_second": 53.834,
55
+ "eval_steps_per_second": 3.368,
56
  "step": 5000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
57
  }
58
  ],
59
+ "logging_steps": 5000,
60
  "max_steps": 100000,
61
  "num_input_tokens_seen": 0,
62
+ "num_train_epochs": 55,
63
+ "save_steps": 5000,
64
  "stateful_callbacks": {
65
  "TrainerControl": {
66
  "args": {
 
73
  "attributes": {}
74
  }
75
  },
76
+ "total_flos": 7921363059826128.0,
77
+ "train_batch_size": 16,
78
  "trial_name": null,
79
  "trial_params": null
80
  }
last-checkpoint/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:95f25db4da551fc09cd5e5e24eb8b5d820beb00de5789c705e05ff4264602603
3
  size 5304
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:512bd16045d9f54ac4b4eaf8dda145bb7ffb9b33ba3722d48f942a6a81d08d16
3
  size 5304