Shubhra Pandit
committed on
Commit
·
fdd6ce2
1
Parent(s):
beb0f06
Upload model files
Browse files
- config.json +4 -4
- generation_config.json +1 -1
- model-00001-of-00009.safetensors +1 -1
- model-00002-of-00009.safetensors +1 -1
- model-00003-of-00009.safetensors +1 -1
- model-00004-of-00009.safetensors +1 -1
- model-00005-of-00009.safetensors +1 -1
- model-00006-of-00009.safetensors +1 -1
- model-00007-of-00009.safetensors +1 -1
- model-00008-of-00009.safetensors +1 -1
- model-00009-of-00009.safetensors +1 -1
- recipe.yaml +6 -1
config.json
CHANGED
@@ -26,7 +26,7 @@
|
|
26 |
"Linear"
|
27 |
],
|
28 |
"weights": {
|
29 |
-
"actorder":
|
30 |
"block_structure": null,
|
31 |
"dynamic": false,
|
32 |
"group_size": 128,
|
@@ -179,7 +179,7 @@
|
|
179 |
"quantization_status": "compressed",
|
180 |
"sparsity_config": {
|
181 |
"format": "dense",
|
182 |
-
"global_sparsity": 0.
|
183 |
"ignore": [
|
184 |
"visual.blocks.0.attn.qkv",
|
185 |
"visual.blocks.0.attn.proj",
|
@@ -893,7 +893,7 @@
|
|
893 |
"sliding_window": 32768,
|
894 |
"tie_word_embeddings": false,
|
895 |
"torch_dtype": "bfloat16",
|
896 |
-
"transformers_version": "4.
|
897 |
"use_cache": true,
|
898 |
"use_sliding_window": false,
|
899 |
"video_token_id": 151656,
|
@@ -907,4 +907,4 @@
|
|
907 |
"vision_start_token_id": 151652,
|
908 |
"vision_token_id": 151654,
|
909 |
"vocab_size": 152064
|
910 |
-
}
|
|
|
26 |
"Linear"
|
27 |
],
|
28 |
"weights": {
|
29 |
+
"actorder": "weight",
|
30 |
"block_structure": null,
|
31 |
"dynamic": false,
|
32 |
"group_size": 128,
|
|
|
179 |
"quantization_status": "compressed",
|
180 |
"sparsity_config": {
|
181 |
"format": "dense",
|
182 |
+
"global_sparsity": 0.15387583782649714,
|
183 |
"ignore": [
|
184 |
"visual.blocks.0.attn.qkv",
|
185 |
"visual.blocks.0.attn.proj",
|
|
|
893 |
"sliding_window": 32768,
|
894 |
"tie_word_embeddings": false,
|
895 |
"torch_dtype": "bfloat16",
|
896 |
+
"transformers_version": "4.48.3",
|
897 |
"use_cache": true,
|
898 |
"use_sliding_window": false,
|
899 |
"video_token_id": 151656,
|
|
|
907 |
"vision_start_token_id": 151652,
|
908 |
"vision_token_id": 151654,
|
909 |
"vocab_size": 152064
|
910 |
+
}
|
generation_config.json
CHANGED
@@ -9,5 +9,5 @@
|
|
9 |
"repetition_penalty": 1.05,
|
10 |
"top_k": 1,
|
11 |
"top_p": 0.001,
|
12 |
-
"transformers_version": "4.48.
|
13 |
}
|
|
|
9 |
"repetition_penalty": 1.05,
|
10 |
"top_k": 1,
|
11 |
"top_p": 0.001,
|
12 |
+
"transformers_version": "4.48.3"
|
13 |
}
|
model-00001-of-00009.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4998143368
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:286138bde3d59bca91eea7bb1efe45f678de6ea4674e3c7d4e213c38e83c2d09
|
3 |
size 4998143368
|
model-00002-of-00009.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4978586536
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1c84d28a68907590cd62fb410aafd427194b45c29c16fe6a9d3d64f285e6de91
|
3 |
size 4978586536
|
model-00003-of-00009.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4978586728
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d389dee3d2a836e157b7ddb8c0ce8cb8320ed32b9913789929d9d22dcc71627f
|
3 |
size 4978586728
|
model-00004-of-00009.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4978586728
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:afc5a071f7edcb4d5902fa22745127a25cba404e6f91e69119833d0c74ac673c
|
3 |
size 4978586728
|
model-00005-of-00009.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4978586728
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3f6209ae402407589dc5cb559e40fca430949167478a589e947bbe2dad59f78c
|
3 |
size 4978586728
|
model-00006-of-00009.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4978586728
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:876b6524f24619ee790de533ac92daabfc95e3e4b1791b58e21e66ffd550259a
|
3 |
size 4978586728
|
model-00007-of-00009.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4978586728
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f9c56cd8ae875eff1dffc7fc06a307a1e76b5bbb5b4df363b40a215b595349ea
|
3 |
size 4978586728
|
model-00008-of-00009.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4978586728
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9deb62264eb323eae0a4c228b8e47a0721e01885b35f2a246e26d191357a8c79
|
3 |
size 4978586728
|
model-00009-of-00009.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 2741257232
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:989e3aaa8d27a6f2ef4ee69339d5beed196c99fb53ab121adbecb3e47f94c9da
|
3 |
size 2741257232
|
recipe.yaml
CHANGED
@@ -2,6 +2,11 @@ DEFAULT_stage:
|
|
2 |
DEFAULT_modifiers:
|
3 |
GPTQModifier:
|
4 |
sequential_targets: [Qwen2VLDecoderLayer]
|
5 |
-
|
|
|
|
|
|
|
|
|
|
|
6 |
targets: Linear
|
7 |
ignore: [lm_head, 're:visual.*']
|
|
|
2 |
DEFAULT_modifiers:
|
3 |
GPTQModifier:
|
4 |
sequential_targets: [Qwen2VLDecoderLayer]
|
5 |
+
dampening_frac: 0.01
|
6 |
+
config_groups:
|
7 |
+
config_group:
|
8 |
+
targets: [Linear]
|
9 |
+
weights: {num_bits: 4, type: int, symmetric: true, group_size: 128, strategy: group,
|
10 |
+
dynamic: false, actorder: weight, observer: minmax}
|
11 |
targets: Linear
|
12 |
ignore: [lm_head, 're:visual.*']
|