Shubhra Pandit committed on
Commit
fdd6ce2
·
1 Parent(s): beb0f06

Upload model files

Browse files
config.json CHANGED
@@ -26,7 +26,7 @@
26
  "Linear"
27
  ],
28
  "weights": {
29
- "actorder": null,
30
  "block_structure": null,
31
  "dynamic": false,
32
  "group_size": 128,
@@ -179,7 +179,7 @@
179
  "quantization_status": "compressed",
180
  "sparsity_config": {
181
  "format": "dense",
182
- "global_sparsity": 0.15412567029899502,
183
  "ignore": [
184
  "visual.blocks.0.attn.qkv",
185
  "visual.blocks.0.attn.proj",
@@ -893,7 +893,7 @@
893
  "sliding_window": 32768,
894
  "tie_word_embeddings": false,
895
  "torch_dtype": "bfloat16",
896
- "transformers_version": "4.47.1",
897
  "use_cache": true,
898
  "use_sliding_window": false,
899
  "video_token_id": 151656,
@@ -907,4 +907,4 @@
907
  "vision_start_token_id": 151652,
908
  "vision_token_id": 151654,
909
  "vocab_size": 152064
910
- }
 
26
  "Linear"
27
  ],
28
  "weights": {
29
+ "actorder": "weight",
30
  "block_structure": null,
31
  "dynamic": false,
32
  "group_size": 128,
 
179
  "quantization_status": "compressed",
180
  "sparsity_config": {
181
  "format": "dense",
182
+ "global_sparsity": 0.15387583782649714,
183
  "ignore": [
184
  "visual.blocks.0.attn.qkv",
185
  "visual.blocks.0.attn.proj",
 
893
  "sliding_window": 32768,
894
  "tie_word_embeddings": false,
895
  "torch_dtype": "bfloat16",
896
+ "transformers_version": "4.48.3",
897
  "use_cache": true,
898
  "use_sliding_window": false,
899
  "video_token_id": 151656,
 
907
  "vision_start_token_id": 151652,
908
  "vision_token_id": 151654,
909
  "vocab_size": 152064
910
+ }
generation_config.json CHANGED
@@ -9,5 +9,5 @@
9
  "repetition_penalty": 1.05,
10
  "top_k": 1,
11
  "top_p": 0.001,
12
- "transformers_version": "4.48.1"
13
  }
 
9
  "repetition_penalty": 1.05,
10
  "top_k": 1,
11
  "top_p": 0.001,
12
+ "transformers_version": "4.48.3"
13
  }
model-00001-of-00009.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d0aceb9c56fe71793960188acc88db8048a7dba241df591701081d84b63023f8
3
  size 4998143368
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:286138bde3d59bca91eea7bb1efe45f678de6ea4674e3c7d4e213c38e83c2d09
3
  size 4998143368
model-00002-of-00009.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:53771ee9263e5fe1b8a5bd97d0b46ef4dcd0ebea8875fd72eebb35d0d6492616
3
  size 4978586536
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1c84d28a68907590cd62fb410aafd427194b45c29c16fe6a9d3d64f285e6de91
3
  size 4978586536
model-00003-of-00009.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5103af8f27f1745f65f11ac3af4b62ae709eaf5e5d30abfcda30c5eb18469bb9
3
  size 4978586728
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d389dee3d2a836e157b7ddb8c0ce8cb8320ed32b9913789929d9d22dcc71627f
3
  size 4978586728
model-00004-of-00009.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:268750612712ca03b35171793bf3222cd8832eba974a624a5136467a46d9e46a
3
  size 4978586728
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:afc5a071f7edcb4d5902fa22745127a25cba404e6f91e69119833d0c74ac673c
3
  size 4978586728
model-00005-of-00009.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:01ffdf53de7def09b55034b7f67b175ffb3997f1cbc8c315ea3258b0bcdbf7d9
3
  size 4978586728
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3f6209ae402407589dc5cb559e40fca430949167478a589e947bbe2dad59f78c
3
  size 4978586728
model-00006-of-00009.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:32bd376650c22ee21b584151baf332d174f87983c5fb778da3fd400a5d04e418
3
  size 4978586728
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:876b6524f24619ee790de533ac92daabfc95e3e4b1791b58e21e66ffd550259a
3
  size 4978586728
model-00007-of-00009.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f2f4ef21454d3fc12f18456a5394e2eb87d900851ca4650e1eb5dbaf8120b3a7
3
  size 4978586728
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f9c56cd8ae875eff1dffc7fc06a307a1e76b5bbb5b4df363b40a215b595349ea
3
  size 4978586728
model-00008-of-00009.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:35cd263f038a68e5bc795139f4a2705c8d42156ae18fa5ddda8b9356db6fb970
3
  size 4978586728
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9deb62264eb323eae0a4c228b8e47a0721e01885b35f2a246e26d191357a8c79
3
  size 4978586728
model-00009-of-00009.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4862d37dd0e87eb89786a3565a8175265258d78a25cba60036f234c0339b5ac2
3
  size 2741257232
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:989e3aaa8d27a6f2ef4ee69339d5beed196c99fb53ab121adbecb3e47f94c9da
3
  size 2741257232
recipe.yaml CHANGED
@@ -2,6 +2,11 @@ DEFAULT_stage:
2
  DEFAULT_modifiers:
3
  GPTQModifier:
4
  sequential_targets: [Qwen2VLDecoderLayer]
5
- scheme: W4A16
 
 
 
 
 
6
  targets: Linear
7
  ignore: [lm_head, 're:visual.*']
 
2
  DEFAULT_modifiers:
3
  GPTQModifier:
4
  sequential_targets: [Qwen2VLDecoderLayer]
5
+ dampening_frac: 0.01
6
+ config_groups:
7
+ config_group:
8
+ targets: [Linear]
9
+ weights: {num_bits: 4, type: int, symmetric: true, group_size: 128, strategy: group,
10
+ dynamic: false, actorder: weight, observer: minmax}
11
  targets: Linear
12
  ignore: [lm_head, 're:visual.*']