Augusto777 committed on
Commit
51704cd
1 Parent(s): 8faa3f7

End of training

Browse files
Files changed (5) hide show
  1. README.md +2 -2
  2. all_results.json +11 -6
  3. eval_results.json +8 -0
  4. train_results.json +6 -6
  5. trainer_state.json +84 -24
README.md CHANGED
@@ -17,8 +17,8 @@ should probably proofread and complete it, then remove this comment. -->
17
 
18
  This model is a fine-tuned version of [google/vit-base-patch16-224](https://huggingface.co/google/vit-base-patch16-224) on an unknown dataset.
19
  It achieves the following results on the evaluation set:
20
- - Loss: 0.4312
21
- - Accuracy: 0.9
22
 
23
  ## Model description
24
 
 
17
 
18
  This model is a fine-tuned version of [google/vit-base-patch16-224](https://huggingface.co/google/vit-base-patch16-224) on an unknown dataset.
19
  It achieves the following results on the evaluation set:
20
+ - Loss: 0.6300
21
+ - Accuracy: 0.95
22
 
23
  ## Model description
24
 
all_results.json CHANGED
@@ -1,8 +1,13 @@
1
  {
2
- "epoch": 2.0,
3
- "total_flos": 2.789761632731136e+16,
4
- "train_loss": 1.476369063059489,
5
- "train_runtime": 26.7457,
6
- "train_samples_per_second": 20.19,
7
- "train_steps_per_second": 0.112
 
 
 
 
 
8
  }
 
1
  {
2
+ "epoch": 8.0,
3
+ "eval_accuracy": 0.95,
4
+ "eval_loss": 0.6299833059310913,
5
+ "eval_runtime": 0.3394,
6
+ "eval_samples_per_second": 58.919,
7
+ "eval_steps_per_second": 2.946,
8
+ "total_flos": 1.1159046530924544e+17,
9
+ "train_loss": 0.795779287815094,
10
+ "train_runtime": 107.6532,
11
+ "train_samples_per_second": 20.064,
12
+ "train_steps_per_second": 0.111
13
  }
eval_results.json ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 8.0,
3
+ "eval_accuracy": 0.95,
4
+ "eval_loss": 0.6299833059310913,
5
+ "eval_runtime": 0.3394,
6
+ "eval_samples_per_second": 58.919,
7
+ "eval_steps_per_second": 2.946
8
+ }
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "epoch": 2.0,
3
- "total_flos": 2.789761632731136e+16,
4
- "train_loss": 1.476369063059489,
5
- "train_runtime": 26.7457,
6
- "train_samples_per_second": 20.19,
7
- "train_steps_per_second": 0.112
8
  }
 
1
  {
2
+ "epoch": 8.0,
3
+ "total_flos": 1.1159046530924544e+17,
4
+ "train_loss": 0.795779287815094,
5
+ "train_runtime": 107.6532,
6
+ "train_samples_per_second": 20.064,
7
+ "train_steps_per_second": 0.111
8
  }
trainer_state.json CHANGED
@@ -1,46 +1,106 @@
1
  {
2
- "best_metric": 0.5,
3
- "best_model_checkpoint": "vit-base-patch16-224-MSC-dmae/checkpoint-3",
4
- "epoch": 2.0,
5
  "eval_steps": 500,
6
- "global_step": 3,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
  "epoch": 0.67,
13
- "eval_accuracy": 0.15,
14
- "eval_loss": 1.6465644836425781,
15
- "eval_runtime": 0.2774,
16
- "eval_samples_per_second": 72.11,
17
- "eval_steps_per_second": 3.606,
18
  "step": 1
19
  },
20
  {
21
  "epoch": 2.0,
22
- "eval_accuracy": 0.5,
23
- "eval_loss": 1.2257916927337646,
24
- "eval_runtime": 0.3307,
25
- "eval_samples_per_second": 60.471,
26
- "eval_steps_per_second": 3.024,
27
  "step": 3
28
  },
29
  {
30
- "epoch": 2.0,
31
- "step": 3,
32
- "total_flos": 2.789761632731136e+16,
33
- "train_loss": 1.476369063059489,
34
- "train_runtime": 26.7457,
35
- "train_samples_per_second": 20.19,
36
- "train_steps_per_second": 0.112
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
37
  }
38
  ],
39
  "logging_steps": 10,
40
- "max_steps": 3,
41
- "num_train_epochs": 3,
42
  "save_steps": 500,
43
- "total_flos": 2.789761632731136e+16,
44
  "trial_name": null,
45
  "trial_params": null
46
  }
 
1
  {
2
+ "best_metric": 0.95,
3
+ "best_model_checkpoint": "vit-base-patch16-224-MSC-dmae/checkpoint-7",
4
+ "epoch": 8.0,
5
  "eval_steps": 500,
6
+ "global_step": 12,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
  "epoch": 0.67,
13
+ "eval_accuracy": 0.5,
14
+ "eval_loss": 1.2257916927337646,
15
+ "eval_runtime": 0.3201,
16
+ "eval_samples_per_second": 62.477,
17
+ "eval_steps_per_second": 3.124,
18
  "step": 1
19
  },
20
  {
21
  "epoch": 2.0,
22
+ "eval_accuracy": 0.7,
23
+ "eval_loss": 1.0536372661590576,
24
+ "eval_runtime": 0.3238,
25
+ "eval_samples_per_second": 61.768,
26
+ "eval_steps_per_second": 3.088,
27
  "step": 3
28
  },
29
  {
30
+ "epoch": 2.67,
31
+ "eval_accuracy": 0.75,
32
+ "eval_loss": 0.9143384099006653,
33
+ "eval_runtime": 0.3026,
34
+ "eval_samples_per_second": 66.089,
35
+ "eval_steps_per_second": 3.304,
36
+ "step": 4
37
+ },
38
+ {
39
+ "epoch": 4.0,
40
+ "eval_accuracy": 0.9,
41
+ "eval_loss": 0.6899412870407104,
42
+ "eval_runtime": 0.3297,
43
+ "eval_samples_per_second": 60.655,
44
+ "eval_steps_per_second": 3.033,
45
+ "step": 6
46
+ },
47
+ {
48
+ "epoch": 4.67,
49
+ "eval_accuracy": 0.95,
50
+ "eval_loss": 0.6299833059310913,
51
+ "eval_runtime": 0.286,
52
+ "eval_samples_per_second": 69.919,
53
+ "eval_steps_per_second": 3.496,
54
+ "step": 7
55
+ },
56
+ {
57
+ "epoch": 6.0,
58
+ "eval_accuracy": 0.9,
59
+ "eval_loss": 0.5069305896759033,
60
+ "eval_runtime": 0.3181,
61
+ "eval_samples_per_second": 62.873,
62
+ "eval_steps_per_second": 3.144,
63
+ "step": 9
64
+ },
65
+ {
66
+ "epoch": 6.67,
67
+ "learning_rate": 1e-05,
68
+ "loss": 0.8554,
69
+ "step": 10
70
+ },
71
+ {
72
+ "epoch": 6.67,
73
+ "eval_accuracy": 0.9,
74
+ "eval_loss": 0.46708640456199646,
75
+ "eval_runtime": 0.317,
76
+ "eval_samples_per_second": 63.085,
77
+ "eval_steps_per_second": 3.154,
78
+ "step": 10
79
+ },
80
+ {
81
+ "epoch": 8.0,
82
+ "eval_accuracy": 0.9,
83
+ "eval_loss": 0.43121227622032166,
84
+ "eval_runtime": 0.3145,
85
+ "eval_samples_per_second": 63.594,
86
+ "eval_steps_per_second": 3.18,
87
+ "step": 12
88
+ },
89
+ {
90
+ "epoch": 8.0,
91
+ "step": 12,
92
+ "total_flos": 1.1159046530924544e+17,
93
+ "train_loss": 0.795779287815094,
94
+ "train_runtime": 107.6532,
95
+ "train_samples_per_second": 20.064,
96
+ "train_steps_per_second": 0.111
97
  }
98
  ],
99
  "logging_steps": 10,
100
+ "max_steps": 12,
101
+ "num_train_epochs": 12,
102
  "save_steps": 500,
103
+ "total_flos": 1.1159046530924544e+17,
104
  "trial_name": null,
105
  "trial_params": null
106
  }