Nyanmero commited on
Commit
c3e2ea8
·
verified ·
1 Parent(s): 17fc66c

Training in progress, step 10000, checkpoint

Browse files
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:27d48542b9818e4e4a293d1d8c9dda9547b0bc96dbdc8160cf051a53ac7d0273
3
  size 577859976
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:028bf0a6547388360f9d61c31c3d8c9ca8de5904332d974377c9e95b583d383e
3
  size 577859976
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d86043f2600663b53b4e1f7c4d965a4b0603ae1690e1cc9d9132974bf6057dfe
3
  size 1155913545
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bcf8b26ebf1a2190706ede053bdef8e0b54454417751cf199f3280cb7f98d6ae
3
  size 1155913545
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d18ddaeceed99e79aa4ac5c182e18d8899aa358265dfca0c3e14dbc0359a6800
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d3a189c587f71772a90681cf9309062314d7cbe24d1b7f1e4297726490f4dbbb
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:237b16a7ce9f6b5a014af36041f5a3bce3b97b7e8b3060da10452bd5dd7eb0ee
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6fa224d225c0288a6e0a18c72b41fbc853d1c25b9331613205b078bf1090ba2c
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,254 +1,49 @@
1
  {
2
- "best_metric": 0.41689586639404297,
3
- "best_model_checkpoint": "./speecht5-tts-vie\\checkpoint-20000",
4
- "epoch": 13.743815283122595,
5
- "eval_steps": 1000,
6
- "global_step": 25000,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
- {
12
- "epoch": 0.5497526113249038,
13
- "eval_loss": 0.5397089123725891,
14
- "eval_runtime": 246.0666,
15
- "eval_samples_per_second": 50.669,
16
- "eval_steps_per_second": 3.17,
17
- "step": 1000
18
- },
19
- {
20
- "epoch": 1.0995052226498077,
21
- "eval_loss": 0.5124471187591553,
22
- "eval_runtime": 233.1296,
23
- "eval_samples_per_second": 53.481,
24
- "eval_steps_per_second": 3.346,
25
- "step": 2000
26
- },
27
- {
28
- "epoch": 1.6492578339747115,
29
- "eval_loss": 0.4633851647377014,
30
- "eval_runtime": 232.6741,
31
- "eval_samples_per_second": 53.586,
32
- "eval_steps_per_second": 3.352,
33
- "step": 3000
34
- },
35
- {
36
- "epoch": 2.1990104452996153,
37
- "eval_loss": 0.4454704225063324,
38
- "eval_runtime": 233.2342,
39
- "eval_samples_per_second": 53.457,
40
- "eval_steps_per_second": 3.344,
41
- "step": 4000
42
- },
43
  {
44
  "epoch": 2.7487630566245187,
45
- "grad_norm": 3.8025379180908203,
46
- "learning_rate": 4.1641666666666665e-05,
47
- "loss": 0.5624,
48
  "step": 5000
49
  },
50
  {
51
  "epoch": 2.7487630566245187,
52
- "eval_loss": 0.436745822429657,
53
- "eval_runtime": 231.6026,
54
- "eval_samples_per_second": 53.834,
55
- "eval_steps_per_second": 3.368,
56
  "step": 5000
57
  },
58
- {
59
- "epoch": 3.298515667949423,
60
- "eval_loss": 0.43301576375961304,
61
- "eval_runtime": 231.9457,
62
- "eval_samples_per_second": 53.754,
63
- "eval_steps_per_second": 3.363,
64
- "step": 6000
65
- },
66
- {
67
- "epoch": 3.8482682792743264,
68
- "eval_loss": 0.43043527007102966,
69
- "eval_runtime": 232.7937,
70
- "eval_samples_per_second": 53.558,
71
- "eval_steps_per_second": 3.351,
72
- "step": 7000
73
- },
74
- {
75
- "epoch": 4.398020890599231,
76
- "eval_loss": 0.42659255862236023,
77
- "eval_runtime": 232.6331,
78
- "eval_samples_per_second": 53.595,
79
- "eval_steps_per_second": 3.353,
80
- "step": 8000
81
- },
82
- {
83
- "epoch": 4.947773501924134,
84
- "eval_loss": 0.4237697124481201,
85
- "eval_runtime": 335.3241,
86
- "eval_samples_per_second": 37.182,
87
- "eval_steps_per_second": 2.326,
88
- "step": 9000
89
- },
90
  {
91
  "epoch": 5.497526113249038,
92
- "grad_norm": 3.957423210144043,
93
- "learning_rate": 8.329166666666667e-05,
94
- "loss": 0.4668,
95
  "step": 10000
96
  },
97
  {
98
  "epoch": 5.497526113249038,
99
- "eval_loss": 0.43070951104164124,
100
- "eval_runtime": 338.8195,
101
- "eval_samples_per_second": 36.798,
102
- "eval_steps_per_second": 2.302,
103
  "step": 10000
104
- },
105
- {
106
- "epoch": 6.047278724573942,
107
- "eval_loss": 0.42637017369270325,
108
- "eval_runtime": 337.6097,
109
- "eval_samples_per_second": 36.93,
110
- "eval_steps_per_second": 2.31,
111
- "step": 11000
112
- },
113
- {
114
- "epoch": 6.597031335898846,
115
- "eval_loss": 0.4261023998260498,
116
- "eval_runtime": 351.5943,
117
- "eval_samples_per_second": 35.461,
118
- "eval_steps_per_second": 2.218,
119
- "step": 12000
120
- },
121
- {
122
- "epoch": 7.146783947223749,
123
- "eval_loss": 0.42608416080474854,
124
- "eval_runtime": 335.0357,
125
- "eval_samples_per_second": 37.214,
126
- "eval_steps_per_second": 2.328,
127
- "step": 13000
128
- },
129
- {
130
- "epoch": 7.696536558548653,
131
- "eval_loss": 0.4257422685623169,
132
- "eval_runtime": 334.2636,
133
- "eval_samples_per_second": 37.3,
134
- "eval_steps_per_second": 2.333,
135
- "step": 14000
136
- },
137
- {
138
- "epoch": 8.246289169873556,
139
- "grad_norm": 1.6813654899597168,
140
- "learning_rate": 9.659886363636365e-05,
141
- "loss": 0.4563,
142
- "step": 15000
143
- },
144
- {
145
- "epoch": 8.246289169873556,
146
- "eval_loss": 0.4219256639480591,
147
- "eval_runtime": 336.8999,
148
- "eval_samples_per_second": 37.008,
149
- "eval_steps_per_second": 2.315,
150
- "step": 15000
151
- },
152
- {
153
- "epoch": 8.796041781198461,
154
- "eval_loss": 0.42107194662094116,
155
- "eval_runtime": 339.383,
156
- "eval_samples_per_second": 36.737,
157
- "eval_steps_per_second": 2.298,
158
- "step": 16000
159
- },
160
- {
161
- "epoch": 9.345794392523365,
162
- "eval_loss": 0.42018377780914307,
163
- "eval_runtime": 336.8885,
164
- "eval_samples_per_second": 37.009,
165
- "eval_steps_per_second": 2.315,
166
- "step": 17000
167
- },
168
- {
169
- "epoch": 9.895547003848268,
170
- "eval_loss": 0.4306410551071167,
171
- "eval_runtime": 338.8623,
172
- "eval_samples_per_second": 36.794,
173
- "eval_steps_per_second": 2.302,
174
- "step": 18000
175
- },
176
- {
177
- "epoch": 10.445299615173171,
178
- "eval_loss": 0.4173683226108551,
179
- "eval_runtime": 382.8942,
180
- "eval_samples_per_second": 32.563,
181
- "eval_steps_per_second": 2.037,
182
- "step": 19000
183
- },
184
- {
185
- "epoch": 10.995052226498077,
186
- "grad_norm": 2.4157445430755615,
187
- "learning_rate": 9.091931818181819e-05,
188
- "loss": 0.4432,
189
- "step": 20000
190
- },
191
- {
192
- "epoch": 10.995052226498077,
193
- "eval_loss": 0.41689586639404297,
194
- "eval_runtime": 399.9359,
195
- "eval_samples_per_second": 31.175,
196
- "eval_steps_per_second": 1.95,
197
- "step": 20000
198
- },
199
- {
200
- "epoch": 11.54480483782298,
201
- "eval_loss": 0.4168870151042938,
202
- "eval_runtime": 381.0473,
203
- "eval_samples_per_second": 32.72,
204
- "eval_steps_per_second": 2.047,
205
- "step": 21000
206
- },
207
- {
208
- "epoch": 12.094557449147883,
209
- "eval_loss": 0.42138534784317017,
210
- "eval_runtime": 372.9871,
211
- "eval_samples_per_second": 33.427,
212
- "eval_steps_per_second": 2.091,
213
- "step": 22000
214
- },
215
- {
216
- "epoch": 12.644310060472787,
217
- "eval_loss": 0.42539912462234497,
218
- "eval_runtime": 449.8771,
219
- "eval_samples_per_second": 27.714,
220
- "eval_steps_per_second": 1.734,
221
- "step": 23000
222
- },
223
- {
224
- "epoch": 13.194062671797692,
225
- "eval_loss": 0.41935691237449646,
226
- "eval_runtime": 477.984,
227
- "eval_samples_per_second": 26.085,
228
- "eval_steps_per_second": 1.632,
229
- "step": 24000
230
- },
231
- {
232
- "epoch": 13.743815283122595,
233
- "grad_norm": 1.6161022186279297,
234
- "learning_rate": 8.523863636363637e-05,
235
- "loss": 0.4325,
236
- "step": 25000
237
- },
238
- {
239
- "epoch": 13.743815283122595,
240
- "eval_loss": 0.41808393597602844,
241
- "eval_runtime": 457.4883,
242
- "eval_samples_per_second": 27.253,
243
- "eval_steps_per_second": 1.705,
244
- "step": 25000
245
  }
246
  ],
247
  "logging_steps": 5000,
248
  "max_steps": 100000,
249
  "num_input_tokens_seen": 0,
250
  "num_train_epochs": 55,
251
- "save_steps": 5000,
252
  "stateful_callbacks": {
253
  "TrainerControl": {
254
  "args": {
@@ -261,7 +56,7 @@
261
  "attributes": {}
262
  }
263
  },
264
- "total_flos": 3.959974797228648e+16,
265
  "train_batch_size": 16,
266
  "trial_name": null,
267
  "trial_params": null
 
1
  {
2
+ "best_metric": NaN,
3
+ "best_model_checkpoint": "./speecht5-tts-vie\\checkpoint-10000",
4
+ "epoch": 5.497526113249038,
5
+ "eval_steps": 5000,
6
+ "global_step": 10000,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
11
  {
12
  "epoch": 2.7487630566245187,
13
+ "grad_norm": NaN,
14
+ "learning_rate": 0.0016583333333333333,
15
+ "loss": 1.0616,
16
  "step": 5000
17
  },
18
  {
19
  "epoch": 2.7487630566245187,
20
+ "eval_loss": NaN,
21
+ "eval_runtime": 332.2788,
22
+ "eval_samples_per_second": 37.523,
23
+ "eval_steps_per_second": 2.347,
24
  "step": 5000
25
  },
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
26
  {
27
  "epoch": 5.497526113249038,
28
+ "grad_norm": NaN,
29
+ "learning_rate": 0.0016583333333333333,
30
+ "loss": 0.0,
31
  "step": 10000
32
  },
33
  {
34
  "epoch": 5.497526113249038,
35
+ "eval_loss": NaN,
36
+ "eval_runtime": 309.5607,
37
+ "eval_samples_per_second": 40.276,
38
+ "eval_steps_per_second": 2.52,
39
  "step": 10000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
40
  }
41
  ],
42
  "logging_steps": 5000,
43
  "max_steps": 100000,
44
  "num_input_tokens_seen": 0,
45
  "num_train_epochs": 55,
46
+ "save_steps": 10000,
47
  "stateful_callbacks": {
48
  "TrainerControl": {
49
  "args": {
 
56
  "attributes": {}
57
  }
58
  },
59
+ "total_flos": 1.5859575977955336e+16,
60
  "train_batch_size": 16,
61
  "trial_name": null,
62
  "trial_params": null
last-checkpoint/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:512bd16045d9f54ac4b4eaf8dda145bb7ffb9b33ba3722d48f942a6a81d08d16
3
  size 5304
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3ff7b688be8240deab18d13754e0ca0ed159df97ff4667f041eadd1a25f5182d
3
  size 5304