jvadlamudi2 committed on
Commit
bfa5bd3
·
1 Parent(s): b230c25

Training in progress, epoch 1

Browse files
all_results.json CHANGED
@@ -5,9 +5,9 @@
5
  "eval_runtime": 1.4896,
6
  "eval_samples_per_second": 75.188,
7
  "eval_steps_per_second": 2.685,
8
- "total_flos": 6.651462652615066e+16,
9
- "train_loss": 0.6625232639766875,
10
- "train_runtime": 75.1281,
11
- "train_samples_per_second": 35.619,
12
- "train_steps_per_second": 0.28
13
  }
 
5
  "eval_runtime": 1.4896,
6
  "eval_samples_per_second": 75.188,
7
  "eval_steps_per_second": 2.685,
8
+ "total_flos": 6.644005855919309e+16,
9
+ "train_loss": 0.6323768979027158,
10
+ "train_runtime": 83.6467,
11
+ "train_samples_per_second": 31.956,
12
+ "train_steps_per_second": 0.251
13
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:05ae6ea2db30a60449e7f2e2047fd7f506db56e77177f16a5117381cbe15cd2d
3
  size 110394865
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f630ad771bbcb24936d993b13a333378922e5cc7d34ffea92fe135220b531c6e
3
  size 110394865
runs/Jul24_17-23-16_79617dc78cd9/events.out.tfevents.1690220278.79617dc78cd9.248.5 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:995812684248a256ee094931636575084f200a159b86589641f5e929b3a098be
3
+ size 4839
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "epoch": 3.0,
3
- "total_flos": 6.651462652615066e+16,
4
- "train_loss": 0.6625232639766875,
5
- "train_runtime": 75.1281,
6
- "train_samples_per_second": 35.619,
7
- "train_steps_per_second": 0.28
8
  }
 
1
  {
2
  "epoch": 3.0,
3
+ "total_flos": 6.644005855919309e+16,
4
+ "train_loss": 0.6323768979027158,
5
+ "train_runtime": 83.6467,
6
+ "train_samples_per_second": 31.956,
7
+ "train_steps_per_second": 0.251
8
  }
trainer_state.json CHANGED
@@ -1,6 +1,6 @@
1
  {
2
- "best_metric": 0.6875,
3
- "best_model_checkpoint": "swin-tiny-patch4-window7-224-jvadlamudi2/checkpoint-21",
4
  "epoch": 3.0,
5
  "global_step": 21,
6
  "is_hyper_param_search": false,
@@ -9,56 +9,56 @@
9
  "log_history": [
10
  {
11
  "epoch": 1.0,
12
- "eval_accuracy": 0.5892857142857143,
13
- "eval_loss": 0.6659354567527771,
14
- "eval_runtime": 0.8649,
15
- "eval_samples_per_second": 129.489,
16
- "eval_steps_per_second": 4.625,
17
  "step": 7
18
  },
19
  {
20
  "epoch": 1.43,
21
  "learning_rate": 3.055555555555556e-05,
22
- "loss": 0.6765,
23
  "step": 10
24
  },
25
  {
26
  "epoch": 2.0,
27
- "eval_accuracy": 0.6517857142857143,
28
- "eval_loss": 0.6479455232620239,
29
- "eval_runtime": 0.8944,
30
- "eval_samples_per_second": 125.219,
31
- "eval_steps_per_second": 4.472,
32
  "step": 14
33
  },
34
  {
35
  "epoch": 2.86,
36
  "learning_rate": 2.777777777777778e-06,
37
- "loss": 0.6502,
38
  "step": 20
39
  },
40
  {
41
  "epoch": 3.0,
42
- "eval_accuracy": 0.6875,
43
- "eval_loss": 0.6389141082763672,
44
- "eval_runtime": 0.8926,
45
- "eval_samples_per_second": 125.472,
46
- "eval_steps_per_second": 4.481,
47
  "step": 21
48
  },
49
  {
50
  "epoch": 3.0,
51
  "step": 21,
52
- "total_flos": 6.651462652615066e+16,
53
- "train_loss": 0.6625232639766875,
54
- "train_runtime": 75.1281,
55
- "train_samples_per_second": 35.619,
56
- "train_steps_per_second": 0.28
57
  }
58
  ],
59
  "max_steps": 21,
60
  "num_train_epochs": 3,
61
- "total_flos": 6.651462652615066e+16,
62
  "trial_name": null,
63
  "trial_params": null
64
  }
 
1
  {
2
+ "best_metric": 0.7142857142857143,
3
+ "best_model_checkpoint": "swin-tiny-patch4-window7-224-jvadlamudi2/checkpoint-14",
4
  "epoch": 3.0,
5
  "global_step": 21,
6
  "is_hyper_param_search": false,
 
9
  "log_history": [
10
  {
11
  "epoch": 1.0,
12
+ "eval_accuracy": 0.5982142857142857,
13
+ "eval_loss": 0.6469235420227051,
14
+ "eval_runtime": 0.9046,
15
+ "eval_samples_per_second": 123.807,
16
+ "eval_steps_per_second": 4.422,
17
  "step": 7
18
  },
19
  {
20
  "epoch": 1.43,
21
  "learning_rate": 3.055555555555556e-05,
22
+ "loss": 0.6532,
23
  "step": 10
24
  },
25
  {
26
  "epoch": 2.0,
27
+ "eval_accuracy": 0.7142857142857143,
28
+ "eval_loss": 0.599132239818573,
29
+ "eval_runtime": 0.9359,
30
+ "eval_samples_per_second": 119.676,
31
+ "eval_steps_per_second": 4.274,
32
  "step": 14
33
  },
34
  {
35
  "epoch": 2.86,
36
  "learning_rate": 2.777777777777778e-06,
37
+ "loss": 0.6128,
38
  "step": 20
39
  },
40
  {
41
  "epoch": 3.0,
42
+ "eval_accuracy": 0.7142857142857143,
43
+ "eval_loss": 0.5942407846450806,
44
+ "eval_runtime": 0.843,
45
+ "eval_samples_per_second": 132.865,
46
+ "eval_steps_per_second": 4.745,
47
  "step": 21
48
  },
49
  {
50
  "epoch": 3.0,
51
  "step": 21,
52
+ "total_flos": 6.644005855919309e+16,
53
+ "train_loss": 0.6323768979027158,
54
+ "train_runtime": 83.6467,
55
+ "train_samples_per_second": 31.956,
56
+ "train_steps_per_second": 0.251
57
  }
58
  ],
59
  "max_steps": 21,
60
  "num_train_epochs": 3,
61
+ "total_flos": 6.644005855919309e+16,
62
  "trial_name": null,
63
  "trial_params": null
64
  }