nomsgadded committed on
Commit
2fcdf67
1 Parent(s): 45bc222

End of training

Browse files
Files changed (4) hide show
  1. README.md +3 -1
  2. all_results.json +5 -5
  3. train_results.json +5 -5
  4. trainer_state.json +30 -12
README.md CHANGED
@@ -2,6 +2,8 @@
2
  license: other
3
  base_model: nvidia/mit-b0
4
  tags:
 
 
5
  - generated_from_trainer
6
  model-index:
7
  - name: Segments
@@ -13,7 +15,7 @@ should probably proofread and complete it, then remove this comment. -->
13
 
14
  # Segments
15
 
16
- This model is a fine-tuned version of [nvidia/mit-b0](https://huggingface.co/nvidia/mit-b0) on an unknown dataset.
17
 
18
  ## Model description
19
 
 
2
  license: other
3
  base_model: nvidia/mit-b0
4
  tags:
5
+ - image-segmentation
6
+ - vision
7
  - generated_from_trainer
8
  model-index:
9
  - name: Segments
 
15
 
16
  # Segments
17
 
18
+ This model is a fine-tuned version of [nvidia/mit-b0](https://huggingface.co/nvidia/mit-b0) on the segments/sidewalk-semantic dataset.
19
 
20
  ## Model description
21
 
all_results.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "epoch": 0.99,
3
  "eval_accuracy_construction-bridge": 0.0,
4
  "eval_accuracy_construction-building": 0.9044887536731845,
5
  "eval_accuracy_construction-door": 0.0,
@@ -77,8 +77,8 @@
77
  "eval_runtime": 166.5888,
78
  "eval_samples_per_second": 0.9,
79
  "eval_steps_per_second": 0.114,
80
- "train_loss": 3.0431386119914503,
81
- "train_runtime": 103.8023,
82
- "train_samples_per_second": 8.189,
83
- "train_steps_per_second": 0.511
84
  }
 
1
  {
2
+ "epoch": 29.72,
3
  "eval_accuracy_construction-bridge": 0.0,
4
  "eval_accuracy_construction-building": 0.9044887536731845,
5
  "eval_accuracy_construction-door": 0.0,
 
77
  "eval_runtime": 166.5888,
78
  "eval_samples_per_second": 0.9,
79
  "eval_steps_per_second": 0.114,
80
+ "train_loss": 1.150932288019912,
81
+ "train_runtime": 3015.3294,
82
+ "train_samples_per_second": 8.457,
83
+ "train_steps_per_second": 0.527
84
  }
train_results.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
- "epoch": 0.99,
3
- "train_loss": 3.0431386119914503,
4
- "train_runtime": 103.8023,
5
- "train_samples_per_second": 8.189,
6
- "train_steps_per_second": 0.511
7
  }
 
1
  {
2
+ "epoch": 29.72,
3
+ "train_loss": 1.150932288019912,
4
+ "train_runtime": 3015.3294,
5
+ "train_samples_per_second": 8.457,
6
+ "train_steps_per_second": 0.527
7
  }
trainer_state.json CHANGED
@@ -1,28 +1,46 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 0.9906542056074766,
5
  "eval_steps": 500,
6
- "global_step": 53,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
- "epoch": 0.99,
13
- "step": 53,
14
- "total_flos": 1.4897641867444224e+16,
15
- "train_loss": 3.0431386119914503,
16
- "train_runtime": 103.8023,
17
- "train_samples_per_second": 8.189,
18
- "train_steps_per_second": 0.511
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
19
  }
20
  ],
21
  "logging_steps": 500,
22
- "max_steps": 53,
23
- "num_train_epochs": 1,
24
  "save_steps": 200,
25
- "total_flos": 1.4897641867444224e+16,
26
  "trial_name": null,
27
  "trial_params": null
28
  }
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 29.7196261682243,
5
  "eval_steps": 500,
6
+ "global_step": 1590,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
+ "epoch": 9.35,
13
+ "learning_rate": 3.4276729559748424e-05,
14
+ "loss": 1.6882,
15
+ "step": 500
16
+ },
17
+ {
18
+ "epoch": 18.69,
19
+ "learning_rate": 1.8553459119496856e-05,
20
+ "loss": 0.9858,
21
+ "step": 1000
22
+ },
23
+ {
24
+ "epoch": 28.04,
25
+ "learning_rate": 2.830188679245283e-06,
26
+ "loss": 0.8402,
27
+ "step": 1500
28
+ },
29
+ {
30
+ "epoch": 29.72,
31
+ "step": 1590,
32
+ "total_flos": 4.438724285646766e+17,
33
+ "train_loss": 1.150932288019912,
34
+ "train_runtime": 3015.3294,
35
+ "train_samples_per_second": 8.457,
36
+ "train_steps_per_second": 0.527
37
  }
38
  ],
39
  "logging_steps": 500,
40
+ "max_steps": 1590,
41
+ "num_train_epochs": 30,
42
  "save_steps": 200,
43
+ "total_flos": 4.438724285646766e+17,
44
  "trial_name": null,
45
  "trial_params": null
46
  }