End of training

Files changed (4) hide show

README.md CHANGED Viewed

@@ -17,13 +17,13 @@ should probably proofread and complete it, then remove this comment. -->
 This model is a fine-tuned version of [google/vit-base-patch16-224-in21k](https://huggingface.co/google/vit-base-patch16-224-in21k) on the food101 dataset.
 It achieves the following results on the evaluation set:
-- eval_loss: 0.7651
-- eval_accuracy: 0.8156
-- eval_runtime: 154.1129
-- eval_samples_per_second: 98.305
-- eval_steps_per_second: 6.145
-- epoch: 26.4
-- step: 25000
 ## Model description

 This model is a fine-tuned version of [google/vit-base-patch16-224-in21k](https://huggingface.co/google/vit-base-patch16-224-in21k) on the food101 dataset.
 It achieves the following results on the evaluation set:
+- eval_loss: 0.7609
+- eval_accuracy: 0.8149
+- eval_runtime: 155.6779
+- eval_samples_per_second: 97.316
+- eval_steps_per_second: 6.083
+- epoch: 27.46
+- step: 26000
 ## Model description

model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:c07c9f219ab17dddb048edc81f52ed98de5117148c986cc434f835c984a9b252
 size 343528508

 version https://git-lfs.github.com/spec/v1
+oid sha256:57b51b89e39855e40356cecad14619ced2468fdb8d02c56cef592f87b8733b9d
 size 343528508

runs/Feb05_03-08-58_983d148b451b/events.out.tfevents.1707102539.983d148b451b.26.0 CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:3d08cb3b0549f26d042533282b0adaec04901eddacd691dc2a26a4ad234f3355
-size 21382

 version https://git-lfs.github.com/spec/v1
+oid sha256:3e3955422c6c1463171f2ade37cabbb1e2b34ea1916abd958b3a0ae68b6b8a0f
+size 21871

trainer_state.json CHANGED Viewed

@@ -1,9 +1,9 @@
 {
   "best_metric": 0.8201980198019801,
   "best_model_checkpoint": "food-image-classification/checkpoint-22000",
-  "epoch": 26.399155227032736,
   "eval_steps": 1000,
-  "global_step": 25000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -382,6 +382,21 @@
       "eval_samples_per_second": 98.305,
       "eval_steps_per_second": 6.145,
       "step": 25000
     }
   ],
   "logging_steps": 1000,
@@ -389,7 +404,7 @@
   "num_input_tokens_seen": 0,
   "num_train_epochs": 500,
   "save_steps": 1000,
-  "total_flos": 1.240810652804309e+20,
   "train_batch_size": 16,
   "trial_name": null,
   "trial_params": null

 {
   "best_metric": 0.8201980198019801,
   "best_model_checkpoint": "food-image-classification/checkpoint-22000",
+  "epoch": 27.455121436114045,
   "eval_steps": 1000,
+  "global_step": 26000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "eval_samples_per_second": 98.305,
       "eval_steps_per_second": 6.145,
       "step": 25000
+    },
+    {
+      "epoch": 27.46,
+      "learning_rate": 2.7455121436114044e-05,
+      "loss": 0.3274,
+      "step": 26000
+    },
+    {
+      "epoch": 27.46,
+      "eval_accuracy": 0.8148514851485148,
+      "eval_loss": 0.760901927947998,
+      "eval_runtime": 155.6779,
+      "eval_samples_per_second": 97.316,
+      "eval_steps_per_second": 6.083,
+      "step": 26000
     }
   ],
   "logging_steps": 1000,
   "num_input_tokens_seen": 0,
   "num_train_epochs": 500,
   "save_steps": 1000,
+  "total_flos": 1.2904433271108772e+20,
   "train_batch_size": 16,
   "trial_name": null,
   "trial_params": null