Mihaiii committed on
Commit
e28503c
·
verified ·
1 Parent(s): 871df39

Upload 8 files

Browse files
config.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "_name_or_path": "TaylorAI/bge-micro",
3
  "architectures": [
4
  "BertModel"
5
  ],
@@ -23,7 +23,6 @@
23
  "num_hidden_layers": 3,
24
  "pad_token_id": 0,
25
  "position_embedding_type": "absolute",
26
- "torch_dtype": "float16",
27
  "transformers_version": "4.40.1",
28
  "type_vocab_size": 2,
29
  "use_cache": true,
 
1
  {
2
+ "_name_or_path": "Mihaiii/Kyurem",
3
  "architectures": [
4
  "BertModel"
5
  ],
 
23
  "num_hidden_layers": 3,
24
  "pad_token_id": 0,
25
  "position_embedding_type": "absolute",
 
26
  "transformers_version": "4.40.1",
27
  "type_vocab_size": 2,
28
  "use_cache": true,
onnx/model.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:92c779d76ee87075794412db4c0bab996f9cac4dbdda79009d5daca5e7364f27
3
+ size 69035106
onnx/model_quantized.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b1c4b2bcc49d74156a96f9c76e4de57329550618dd11d60bc3039ef4f80a5da9
3
+ size 17452601
quantize_config.json ADDED
@@ -0,0 +1,30 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "per_channel": true,
3
+ "reduce_range": true,
4
+ "per_model_config": {
5
+ "model": {
6
+ "op_types": [
7
+ "Constant",
8
+ "Concat",
9
+ "ReduceMean",
10
+ "Reshape",
11
+ "Cast",
12
+ "Transpose",
13
+ "Sub",
14
+ "Mul",
15
+ "Shape",
16
+ "Sqrt",
17
+ "Pow",
18
+ "Erf",
19
+ "Gather",
20
+ "MatMul",
21
+ "Unsqueeze",
22
+ "Softmax",
23
+ "Slice",
24
+ "Div",
25
+ "Add"
26
+ ],
27
+ "weight_type": "QInt8"
28
+ }
29
+ }
30
+ }