Add model files and configs

Files changed (6) hide show

all_results.json CHANGED Viewed

@@ -1,7 +1,7 @@
 {
     "epoch": 3.0,
-    "train_loss": 0.5953705310821533,
-    "train_runtime": 22.7307,
-    "train_samples_per_second": 8.183,
-    "train_steps_per_second": 1.056
 }

 {
     "epoch": 3.0,
+    "train_loss": 0.6169168684217665,
+    "train_runtime": 24.7305,
+    "train_samples_per_second": 7.885,
+    "train_steps_per_second": 1.092
 }

onnx/model_quantized.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:b6a382ddc11e568915fa205c55174e03550e69c4a0f771a5899549a6a952a5d3
 size 87112360

 version https://git-lfs.github.com/spec/v1
+oid sha256:5a2c65e770aa3d504ae301be61c49eb14aa6aa2ccbaf45600c3c567d883b02d0
 size 87112360

quantize_config.json CHANGED Viewed

@@ -4,30 +4,30 @@
     "per_model_config": {
         "model": {
             "op_types": [
-                "MatMul",
                 "Sqrt",
-                "ConstantOfShape",
-                "Mul",
-                "Concat",
-                "Gather",
-                "Transpose",
-                "Expand",
-                "Gemm",
-                "Div",
-                "ReduceMean",
-                "Conv",
                 "Unsqueeze",
-                "Sub",
                 "Softmax",
-                "Add",
                 "Slice",
-                "Pow",
-                "Erf",
-                "Where",
-                "Constant",
                 "Reshape",
                 "Shape",
-                "Equal"
             ],
             "weight_type": "QUInt8"
         }

     "per_model_config": {
         "model": {
             "op_types": [
                 "Sqrt",
+                "Pow",
                 "Unsqueeze",
                 "Softmax",
                 "Slice",
+                "ReduceMean",
+                "Gather",
+                "Concat",
+                "Mul",
+                "Conv",
+                "Expand",
+                "Gemm",
+                "Transpose",
                 "Reshape",
+                "Add",
                 "Shape",
+                "Constant",
+                "Where",
+                "Sub",
+                "Equal",
+                "Erf",
+                "ConstantOfShape",
+                "MatMul",
+                "Div"
             ],
             "weight_type": "QUInt8"
         }

train_results.json CHANGED Viewed

@@ -1,7 +1,7 @@
 {
     "epoch": 3.0,
-    "train_loss": 0.5953705310821533,
-    "train_runtime": 22.7307,
-    "train_samples_per_second": 8.183,
-    "train_steps_per_second": 1.056
 }

 {
     "epoch": 3.0,
+    "train_loss": 0.6169168684217665,
+    "train_runtime": 24.7305,
+    "train_samples_per_second": 7.885,
+    "train_steps_per_second": 1.092
 }

trainer_state.json CHANGED Viewed

@@ -3,26 +3,26 @@
   "best_model_checkpoint": null,
   "epoch": 3.0,
   "eval_steps": 500,
-  "global_step": 24,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
   "log_history": [
     {
       "epoch": 3.0,
-      "step": 24,
-      "total_flos": 1.4415187272966144e+16,
-      "train_loss": 0.5953705310821533,
-      "train_runtime": 22.7307,
-      "train_samples_per_second": 8.183,
-      "train_steps_per_second": 1.056
     }
   ],
   "logging_steps": 500,
-  "max_steps": 24,
   "num_train_epochs": 3,
   "save_steps": 500,
-  "total_flos": 1.4415187272966144e+16,
   "trial_name": null,
   "trial_params": null
 }

   "best_model_checkpoint": null,
   "epoch": 3.0,
   "eval_steps": 500,
+  "global_step": 27,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
   "log_history": [
     {
       "epoch": 3.0,
+      "step": 27,
+      "total_flos": 1.511269633456128e+16,
+      "train_loss": 0.6169168684217665,
+      "train_runtime": 24.7305,
+      "train_samples_per_second": 7.885,
+      "train_steps_per_second": 1.092
     }
   ],
   "logging_steps": 500,
+  "max_steps": 27,
   "num_train_epochs": 3,
   "save_steps": 500,
+  "total_flos": 1.511269633456128e+16,
   "trial_name": null,
   "trial_params": null
 }

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:e02720ee20fec8b4598a5fba809bb682e12e584fcae6a810511f14d329ec20a9
 size 4536

 version https://git-lfs.github.com/spec/v1
+oid sha256:bcda69e54f5f1cec25cd8381adf4941b7cb79df3e933b22e4d18e5d81434cbe7
 size 4536