yhyhy3 committed on
Commit
2a220ba
1 Parent(s): 47a693f

Add model files and configs

Browse files
all_results.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
  "epoch": 3.0,
3
- "train_loss": 0.5636956691741943,
4
- "train_runtime": 22.0278,
5
- "train_samples_per_second": 8.444,
6
- "train_steps_per_second": 1.09
7
  }
 
1
  {
2
  "epoch": 3.0,
3
+ "train_loss": 0.5953705310821533,
4
+ "train_runtime": 22.7307,
5
+ "train_samples_per_second": 8.183,
6
+ "train_steps_per_second": 1.056
7
  }
onnx/model_quantized.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6be8652642ea8552c3f501ed1c58b2a72737f97a68d2a1b31dc143d151eb9b45
3
  size 87112360
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b6a382ddc11e568915fa205c55174e03550e69c4a0f771a5899549a6a952a5d3
3
  size 87112360
quantize_config.json CHANGED
@@ -4,30 +4,30 @@
4
  "per_model_config": {
5
  "model": {
6
  "op_types": [
7
- "Slice",
8
  "Sqrt",
 
 
 
 
 
 
9
  "Gemm",
10
- "Shape",
11
  "ReduceMean",
12
- "Constant",
13
- "Reshape",
14
- "Equal",
15
- "MatMul",
16
- "Mul",
17
  "Unsqueeze",
18
- "Where",
19
- "Erf",
20
- "Pow",
21
  "Softmax",
22
- "Transpose",
23
  "Add",
24
- "Conv",
25
- "ConstantOfShape",
26
- "Expand",
27
- "Div",
28
- "Concat",
29
- "Gather",
30
- "Sub"
 
31
  ],
32
  "weight_type": "QUInt8"
33
  }
 
4
  "per_model_config": {
5
  "model": {
6
  "op_types": [
7
+ "MatMul",
8
  "Sqrt",
9
+ "ConstantOfShape",
10
+ "Mul",
11
+ "Concat",
12
+ "Gather",
13
+ "Transpose",
14
+ "Expand",
15
  "Gemm",
16
+ "Div",
17
  "ReduceMean",
18
+ "Conv",
 
 
 
 
19
  "Unsqueeze",
20
+ "Sub",
 
 
21
  "Softmax",
 
22
  "Add",
23
+ "Slice",
24
+ "Pow",
25
+ "Erf",
26
+ "Where",
27
+ "Constant",
28
+ "Reshape",
29
+ "Shape",
30
+ "Equal"
31
  ],
32
  "weight_type": "QUInt8"
33
  }
train_results.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
  "epoch": 3.0,
3
- "train_loss": 0.5636956691741943,
4
- "train_runtime": 22.0278,
5
- "train_samples_per_second": 8.444,
6
- "train_steps_per_second": 1.09
7
  }
 
1
  {
2
  "epoch": 3.0,
3
+ "train_loss": 0.5953705310821533,
4
+ "train_runtime": 22.7307,
5
+ "train_samples_per_second": 8.183,
6
+ "train_steps_per_second": 1.056
7
  }
trainer_state.json CHANGED
@@ -12,10 +12,10 @@
12
  "epoch": 3.0,
13
  "step": 24,
14
  "total_flos": 1.4415187272966144e+16,
15
- "train_loss": 0.5636956691741943,
16
- "train_runtime": 22.0278,
17
- "train_samples_per_second": 8.444,
18
- "train_steps_per_second": 1.09
19
  }
20
  ],
21
  "logging_steps": 500,
 
12
  "epoch": 3.0,
13
  "step": 24,
14
  "total_flos": 1.4415187272966144e+16,
15
+ "train_loss": 0.5953705310821533,
16
+ "train_runtime": 22.7307,
17
+ "train_samples_per_second": 8.183,
18
+ "train_steps_per_second": 1.056
19
  }
20
  ],
21
  "logging_steps": 500,
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:05921028ea1d9a15207f7bdfd50062ae83d562fa4e1aa0f49ed1af08fd4888eb
3
  size 4536
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e02720ee20fec8b4598a5fba809bb682e12e584fcae6a810511f14d329ec20a9
3
  size 4536