Add model files and configs

Files changed (6) hide show

all_results.json CHANGED Viewed

@@ -1,7 +1,7 @@
 {
     "epoch": 3.0,
-    "train_loss": 0.5741025606791178,
-    "train_runtime": 21.8228,
-    "train_samples_per_second": 8.111,
-    "train_steps_per_second": 1.1
 }

 {
     "epoch": 3.0,
+    "train_loss": 0.625487764676412,
+    "train_runtime": 21.7193,
+    "train_samples_per_second": 8.288,
+    "train_steps_per_second": 1.105
 }

onnx/model_quantized.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:c148401cd25f4710e21636a23f9aeae74eaa1a4943dc06982f231a40b2810cba
 size 87112360

 version https://git-lfs.github.com/spec/v1
+oid sha256:e8fd0c18e7ecafd2579724b6f3ce126621bdb13f8381358d9cc79f55e82fdd52
 size 87112360

quantize_config.json CHANGED Viewed

@@ -4,30 +4,30 @@
     "per_model_config": {
         "model": {
             "op_types": [
-                "Expand",
-                "ConstantOfShape",
-                "MatMul",
-                "Div",
-                "Concat",
-                "Softmax",
                 "Erf",
                 "Sqrt",
-                "Gemm",
-                "Constant",
-                "Transpose",
-                "Equal",
-                "Sub",
-                "Reshape",
                 "Shape",
-                "ReduceMean",
                 "Unsqueeze",
-                "Gather",
                 "Where",
                 "Mul",
-                "Conv",
-                "Pow",
-                "Add",
-                "Slice"
             ],
             "weight_type": "QUInt8"
         }

     "per_model_config": {
         "model": {
             "op_types": [
+                "Constant",
+                "Gather",
                 "Erf",
+                "Add",
                 "Sqrt",
+                "Pow",
+                "Concat",
                 "Shape",
+                "Reshape",
+                "Expand",
+                "Div",
+                "Sub",
+                "Gemm",
+                "MatMul",
+                "ConstantOfShape",
                 "Unsqueeze",
+                "Slice",
+                "Conv",
                 "Where",
+                "Softmax",
                 "Mul",
+                "ReduceMean",
+                "Equal",
+                "Transpose"
             ],
             "weight_type": "QUInt8"
         }

train_results.json CHANGED Viewed

@@ -1,7 +1,7 @@
 {
     "epoch": 3.0,
-    "train_loss": 0.5741025606791178,
-    "train_runtime": 21.8228,
-    "train_samples_per_second": 8.111,
-    "train_steps_per_second": 1.1
 }

 {
     "epoch": 3.0,
+    "train_loss": 0.625487764676412,
+    "train_runtime": 21.7193,
+    "train_samples_per_second": 8.288,
+    "train_steps_per_second": 1.105
 }

trainer_state.json CHANGED Viewed

@@ -11,18 +11,18 @@
     {
       "epoch": 3.0,
       "step": 24,
-      "total_flos": 1.3717678211371008e+16,
-      "train_loss": 0.5741025606791178,
-      "train_runtime": 21.8228,
-      "train_samples_per_second": 8.111,
-      "train_steps_per_second": 1.1
     }
   ],
   "logging_steps": 500,
   "max_steps": 24,
   "num_train_epochs": 3,
   "save_steps": 500,
-  "total_flos": 1.3717678211371008e+16,
   "trial_name": null,
   "trial_params": null
 }

     {
       "epoch": 3.0,
       "step": 24,
+      "total_flos": 1.395018123190272e+16,
+      "train_loss": 0.625487764676412,
+      "train_runtime": 21.7193,
+      "train_samples_per_second": 8.288,
+      "train_steps_per_second": 1.105
     }
   ],
   "logging_steps": 500,
   "max_steps": 24,
   "num_train_epochs": 3,
   "save_steps": 500,
+  "total_flos": 1.395018123190272e+16,
   "trial_name": null,
   "trial_params": null
 }

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:07eb2bb8358ee16c8d302239eea02906b9e53fe7bde34e6c71c0ca9b0d1f2055
 size 4536

 version https://git-lfs.github.com/spec/v1
+oid sha256:e50035b9f4f234d430aefeaf1426c9fcd9a533f70893f5d51eb3c86a1fa1e3e5
 size 4536