gustavomalkomes committed on
Commit
54724c8
·
verified ·
1 Parent(s): d3549a6

End of training

Browse files
README.md CHANGED
@@ -3,7 +3,11 @@ library_name: transformers
3
  license: apache-2.0
4
  base_model: google/vit-base-patch16-224-in21k
5
  tags:
 
 
6
  - generated_from_trainer
 
 
7
  model-index:
8
  - name: vit-base-patch16-224-in21k
9
  results: []
@@ -14,7 +18,13 @@ should probably proofread and complete it, then remove this comment. -->
14
 
15
  # vit-base-patch16-224-in21k
16
 
17
- This model is a fine-tuned version of [google/vit-base-patch16-224-in21k](https://huggingface.co/google/vit-base-patch16-224-in21k) on an unknown dataset.
 
 
 
 
 
 
18
 
19
  ## Model description
20
 
 
3
  license: apache-2.0
4
  base_model: google/vit-base-patch16-224-in21k
5
  tags:
6
+ - image-classification
7
+ - vision
8
  - generated_from_trainer
9
+ metrics:
10
+ - accuracy
11
  model-index:
12
  - name: vit-base-patch16-224-in21k
13
  results: []
 
18
 
19
  # vit-base-patch16-224-in21k
20
 
21
+ This model is a fine-tuned version of [google/vit-base-patch16-224-in21k](https://huggingface.co/google/vit-base-patch16-224-in21k) on the chainyo/rvl-cdip dataset.
22
+ It achieves the following results on the evaluation set:
23
+ - Loss: nan
24
+ - Accuracy: 0.0630
25
+ - Memory Allocated (gb): 1.53
26
+ - Max Memory Allocated (gb): 1.61
27
+ - Total Memory Available (gb): 126.62
28
 
29
  ## Model description
30
 
all_results.json CHANGED
@@ -2,15 +2,15 @@
2
  "epoch": 3.0,
3
  "eval_accuracy": 0.06302083333333333,
4
  "eval_loss": NaN,
5
- "eval_runtime": 239.9792,
6
- "eval_samples_per_second": 200.017,
7
- "eval_steps_per_second": 3.125,
8
- "max_memory_allocated (GB)": 0.97,
9
- "memory_allocated (GB)": 0.97,
10
  "total_flos": 6.324139790696448e+19,
11
  "total_memory_available (GB)": 126.62,
12
  "train_loss": 0.0,
13
- "train_runtime": 81.7036,
14
- "train_samples_per_second": 9987.288,
15
- "train_steps_per_second": 1248.416
16
  }
 
2
  "epoch": 3.0,
3
  "eval_accuracy": 0.06302083333333333,
4
  "eval_loss": NaN,
5
+ "eval_runtime": 242.9557,
6
+ "eval_samples_per_second": 197.567,
7
+ "eval_steps_per_second": 3.087,
8
+ "max_memory_allocated (GB)": 1.61,
9
+ "memory_allocated (GB)": 1.53,
10
  "total_flos": 6.324139790696448e+19,
11
  "total_memory_available (GB)": 126.62,
12
  "train_loss": 0.0,
13
+ "train_runtime": 0.0058,
14
+ "train_samples_per_second": 140961263.636,
15
+ "train_steps_per_second": 17620222.735
16
  }
config.json CHANGED
@@ -54,6 +54,7 @@
54
  "num_channels": 3,
55
  "num_hidden_layers": 12,
56
  "patch_size": 16,
 
57
  "qkv_bias": true,
58
  "torch_dtype": "float32",
59
  "transformers_version": "4.45.2"
 
54
  "num_channels": 3,
55
  "num_hidden_layers": 12,
56
  "patch_size": 16,
57
+ "problem_type": "single_label_classification",
58
  "qkv_bias": true,
59
  "torch_dtype": "float32",
60
  "transformers_version": "4.45.2"
eval_results.json CHANGED
@@ -2,9 +2,9 @@
2
  "epoch": 3.0,
3
  "eval_accuracy": 0.06302083333333333,
4
  "eval_loss": NaN,
5
- "eval_runtime": 239.9792,
6
- "eval_samples_per_second": 200.017,
7
- "eval_steps_per_second": 3.125,
8
  "max_memory_allocated (GB)": 1.61,
9
  "memory_allocated (GB)": 1.53,
10
  "total_memory_available (GB)": 126.62
 
2
  "epoch": 3.0,
3
  "eval_accuracy": 0.06302083333333333,
4
  "eval_loss": NaN,
5
+ "eval_runtime": 242.9557,
6
+ "eval_samples_per_second": 197.567,
7
+ "eval_steps_per_second": 3.087,
8
  "max_memory_allocated (GB)": 1.61,
9
  "memory_allocated (GB)": 1.53,
10
  "total_memory_available (GB)": 126.62
runs/Nov06_05-38-19_gtown-28NZK54/events.out.tfevents.1730871752.gtown-28NZK54.8152.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a6145d9b31fb5311809ed1dfa5cdf319e7b3bf62bf29e4339f335cffc11ebdc3
3
+ size 580
train_results.json CHANGED
@@ -5,7 +5,7 @@
5
  "total_flos": 6.324139790696448e+19,
6
  "total_memory_available (GB)": 126.62,
7
  "train_loss": 0.0,
8
- "train_runtime": 81.7036,
9
- "train_samples_per_second": 9987.288,
10
- "train_steps_per_second": 1248.416
11
  }
 
5
  "total_flos": 6.324139790696448e+19,
6
  "total_memory_available (GB)": 126.62,
7
  "train_loss": 0.0,
8
+ "train_runtime": 0.0058,
9
+ "train_samples_per_second": 140961263.636,
10
+ "train_steps_per_second": 17620222.735
11
  }
trainer_state.json CHANGED
@@ -2056,9 +2056,9 @@
2056
  "total_flos": 6.324139790696448e+19,
2057
  "total_memory_available (GB)": 126.62,
2058
  "train_loss": 0.0,
2059
- "train_runtime": 81.7036,
2060
- "train_samples_per_second": 9987.288,
2061
- "train_steps_per_second": 1248.416
2062
  }
2063
  ],
2064
  "logging_steps": 500,
 
2056
  "total_flos": 6.324139790696448e+19,
2057
  "total_memory_available (GB)": 126.62,
2058
  "train_loss": 0.0,
2059
+ "train_runtime": 0.0058,
2060
+ "train_samples_per_second": 140961263.636,
2061
+ "train_steps_per_second": 17620222.735
2062
  }
2063
  ],
2064
  "logging_steps": 500,