Upload folder using huggingface_hub
Browse files
- config.json +3 -3
- model.safetensors +2 -2
- recipe.yaml +1 -1
config.json
CHANGED
@@ -32,14 +32,14 @@
|
|
32 |
"num_bits": 8,
|
33 |
"observer": "minmax",
|
34 |
"observer_kwargs": {},
|
35 |
-
"strategy": "
|
36 |
"symmetric": true,
|
37 |
"type": "int"
|
38 |
}
|
39 |
}
|
40 |
},
|
41 |
"format": "int-quantized",
|
42 |
-
"global_compression_ratio": 1.
|
43 |
"ignore": [
|
44 |
"lm_head"
|
45 |
],
|
@@ -48,7 +48,7 @@
|
|
48 |
},
|
49 |
"sparsity_config": {
|
50 |
"format": "dense",
|
51 |
-
"global_sparsity":
|
52 |
"registry_requires_subclass": false,
|
53 |
"sparsity_structure": "unstructured"
|
54 |
}
|
|
|
32 |
"num_bits": 8,
|
33 |
"observer": "minmax",
|
34 |
"observer_kwargs": {},
|
35 |
+
"strategy": "tensor",
|
36 |
"symmetric": true,
|
37 |
"type": "int"
|
38 |
}
|
39 |
}
|
40 |
},
|
41 |
"format": "int-quantized",
|
42 |
+
"global_compression_ratio": 1.2391304140415598,
|
43 |
"ignore": [
|
44 |
"lm_head"
|
45 |
],
|
|
|
48 |
},
|
49 |
"sparsity_config": {
|
50 |
"format": "dense",
|
51 |
+
"global_sparsity": 7.819650685473849,
|
52 |
"registry_requires_subclass": false,
|
53 |
"sparsity_structure": "unstructured"
|
54 |
}
|
model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:68c532b04501830ec5a92b14272c2cb59b8b419a2c521e57152457fb88243d5c
|
3 |
+
size 1231252556
|
recipe.yaml
CHANGED
@@ -5,6 +5,6 @@ quant_stage:
|
|
5 |
ignore: [lm_head]
|
6 |
config_groups:
|
7 |
group_0:
|
8 |
-
weights: {num_bits: 8, type: int, symmetric: true, strategy:
|
9 |
input_activations: {num_bits: 8, type: int, symmetric: true, dynamic: true, strategy: token}
|
10 |
targets: [Linear]
|
|
|
5 |
ignore: [lm_head]
|
6 |
config_groups:
|
7 |
group_0:
|
8 |
+
weights: {num_bits: 8, type: int, symmetric: true, strategy: tensor}
|
9 |
input_activations: {num_bits: 8, type: int, symmetric: true, dynamic: true, strategy: token}
|
10 |
targets: [Linear]
|