sadkins65 committed on
Commit
949d397
1 Parent(s): 393d709

Upload folder using huggingface_hub

Browse files
Files changed (3) hide show
  1. config.json +3 -3
  2. model.safetensors +2 -2
  3. recipe.yaml +1 -1
config.json CHANGED
@@ -32,14 +32,14 @@
32
  "num_bits": 8,
33
  "observer": "minmax",
34
  "observer_kwargs": {},
35
- "strategy": "channel",
36
  "symmetric": true,
37
  "type": "int"
38
  }
39
  }
40
  },
41
  "format": "int-quantized",
42
- "global_compression_ratio": 1.2390773684863086,
43
  "ignore": [
44
  "lm_head"
45
  ],
@@ -48,7 +48,7 @@
48
  },
49
  "sparsity_config": {
50
  "format": "dense",
51
- "global_sparsity": 1.188444907528722,
52
  "registry_requires_subclass": false,
53
  "sparsity_structure": "unstructured"
54
  }
 
32
  "num_bits": 8,
33
  "observer": "minmax",
34
  "observer_kwargs": {},
35
+ "strategy": "tensor",
36
  "symmetric": true,
37
  "type": "int"
38
  }
39
  }
40
  },
41
  "format": "int-quantized",
42
+ "global_compression_ratio": 1.2391304140415598,
43
  "ignore": [
44
  "lm_head"
45
  ],
 
48
  },
49
  "sparsity_config": {
50
  "format": "dense",
51
+ "global_sparsity": 7.819650685473849,
52
  "registry_requires_subclass": false,
53
  "sparsity_structure": "unstructured"
54
  }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ed7796316a087eaf71963e35ff79ae097d02000411fc834b315d0bf399ad870c
3
- size 1232041608
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:68c532b04501830ec5a92b14272c2cb59b8b419a2c521e57152457fb88243d5c
3
+ size 1231252556
recipe.yaml CHANGED
@@ -5,6 +5,6 @@ quant_stage:
5
  ignore: [lm_head]
6
  config_groups:
7
  group_0:
8
- weights: {num_bits: 8, type: int, symmetric: true, strategy: channel}
9
  input_activations: {num_bits: 8, type: int, symmetric: true, dynamic: true, strategy: token}
10
  targets: [Linear]
 
5
  ignore: [lm_head]
6
  config_groups:
7
  group_0:
8
+ weights: {num_bits: 8, type: int, symmetric: true, strategy: tensor}
9
  input_activations: {num_bits: 8, type: int, symmetric: true, dynamic: true, strategy: token}
10
  targets: [Linear]