win10 committed on
Commit
13068c2
1 Parent(s): ad86d06

Upload folder using huggingface_hub

Browse files
This view is limited to 50 files because it contains too many changes. See raw diff
Files changed (50) hide show
  1. .gitattributes +1 -0
  2. README.md +50 -0
  3. added_tokens.json +24 -0
  4. config.json +29 -0
  5. mergekit_config.yml +21 -0
  6. merges.txt +0 -0
  7. model-00001-of-00051.safetensors +3 -0
  8. model-00002-of-00051.safetensors +3 -0
  9. model-00003-of-00051.safetensors +3 -0
  10. model-00004-of-00051.safetensors +3 -0
  11. model-00005-of-00051.safetensors +3 -0
  12. model-00006-of-00051.safetensors +3 -0
  13. model-00007-of-00051.safetensors +3 -0
  14. model-00008-of-00051.safetensors +3 -0
  15. model-00009-of-00051.safetensors +3 -0
  16. model-00010-of-00051.safetensors +3 -0
  17. model-00011-of-00051.safetensors +3 -0
  18. model-00012-of-00051.safetensors +3 -0
  19. model-00013-of-00051.safetensors +3 -0
  20. model-00014-of-00051.safetensors +3 -0
  21. model-00015-of-00051.safetensors +3 -0
  22. model-00016-of-00051.safetensors +3 -0
  23. model-00017-of-00051.safetensors +3 -0
  24. model-00018-of-00051.safetensors +3 -0
  25. model-00019-of-00051.safetensors +3 -0
  26. model-00020-of-00051.safetensors +3 -0
  27. model-00021-of-00051.safetensors +3 -0
  28. model-00022-of-00051.safetensors +3 -0
  29. model-00023-of-00051.safetensors +3 -0
  30. model-00024-of-00051.safetensors +3 -0
  31. model-00025-of-00051.safetensors +3 -0
  32. model-00026-of-00051.safetensors +3 -0
  33. model-00027-of-00051.safetensors +3 -0
  34. model-00028-of-00051.safetensors +3 -0
  35. model-00029-of-00051.safetensors +3 -0
  36. model-00030-of-00051.safetensors +3 -0
  37. model-00031-of-00051.safetensors +3 -0
  38. model-00032-of-00051.safetensors +3 -0
  39. model-00033-of-00051.safetensors +3 -0
  40. model-00034-of-00051.safetensors +3 -0
  41. model-00035-of-00051.safetensors +3 -0
  42. model-00036-of-00051.safetensors +3 -0
  43. model-00037-of-00051.safetensors +3 -0
  44. model-00038-of-00051.safetensors +3 -0
  45. model-00039-of-00051.safetensors +3 -0
  46. model-00040-of-00051.safetensors +3 -0
  47. model-00041-of-00051.safetensors +3 -0
  48. model-00042-of-00051.safetensors +3 -0
  49. model-00043-of-00051.safetensors +3 -0
  50. model-00044-of-00051.safetensors +3 -0
.gitattributes CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ tokenizer.json filter=lfs diff=lfs merge=lfs -text
README.md ADDED
@@ -0,0 +1,50 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ base_model:
3
+ - Qwen/Qwen2.5-Coder-7B-Instruct
4
+ library_name: transformers
5
+ tags:
6
+ - mergekit
7
+ - merge
8
+
9
+ ---
10
+ # merge
11
+
12
+ This is a merge of pre-trained language models created using [mergekit](https://github.com/cg123/mergekit).
13
+
14
+ ## Merge Details
15
+ ### Merge Method
16
+
17
+ This model was merged using the passthrough merge method.
18
+
19
+ ### Models Merged
20
+
21
+ The following models were included in the merge:
22
+ * [Qwen/Qwen2.5-Coder-7B-Instruct](https://huggingface.co/Qwen/Qwen2.5-Coder-7B-Instruct)
23
+
24
+ ### Configuration
25
+
26
+ The following YAML configuration was used to produce this model:
27
+
28
+ ```yaml
29
+ dtype: bfloat16
30
+ merge_method: passthrough
31
+ slices:
32
+ - sources:
33
+   - layer_range: [0, 8]
34
+     model: Qwen/Qwen2.5-Coder-7B-Instruct
35
+ - sources:
36
+   - layer_range: [4, 12]
37
+     model: Qwen/Qwen2.5-Coder-7B-Instruct
38
+ - sources:
39
+   - layer_range: [8, 16]
40
+     model: Qwen/Qwen2.5-Coder-7B-Instruct
41
+ - sources:
42
+   - layer_range: [12, 20]
43
+     model: Qwen/Qwen2.5-Coder-7B-Instruct
44
+ - sources:
45
+   - layer_range: [16, 24]
46
+     model: Qwen/Qwen2.5-Coder-7B-Instruct
47
+ - sources:
48
+   - layer_range: [20, 28]
49
+     model: Qwen/Qwen2.5-Coder-7B-Instruct
50
+ ```
added_tokens.json ADDED
@@ -0,0 +1,24 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "</tool_call>": 151658,
3
+ "<tool_call>": 151657,
4
+ "<|box_end|>": 151649,
5
+ "<|box_start|>": 151648,
6
+ "<|endoftext|>": 151643,
7
+ "<|file_sep|>": 151664,
8
+ "<|fim_middle|>": 151660,
9
+ "<|fim_pad|>": 151662,
10
+ "<|fim_prefix|>": 151659,
11
+ "<|fim_suffix|>": 151661,
12
+ "<|im_end|>": 151645,
13
+ "<|im_start|>": 151644,
14
+ "<|image_pad|>": 151655,
15
+ "<|object_ref_end|>": 151647,
16
+ "<|object_ref_start|>": 151646,
17
+ "<|quad_end|>": 151651,
18
+ "<|quad_start|>": 151650,
19
+ "<|repo_name|>": 151663,
20
+ "<|video_pad|>": 151656,
21
+ "<|vision_end|>": 151653,
22
+ "<|vision_pad|>": 151654,
23
+ "<|vision_start|>": 151652
24
+ }
config.json ADDED
@@ -0,0 +1,29 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "Qwen/Qwen2.5-Coder-7B-Instruct",
3
+ "architectures": [
4
+ "Qwen2ForCausalLM"
5
+ ],
6
+ "attention_dropout": 0.0,
7
+ "bos_token_id": 151643,
8
+ "eos_token_id": 151645,
9
+ "hidden_act": "silu",
10
+ "hidden_size": 3584,
11
+ "initializer_range": 0.02,
12
+ "intermediate_size": 18944,
13
+ "max_position_embeddings": 32768,
14
+ "max_window_layers": 28,
15
+ "model_type": "qwen2",
16
+ "num_attention_heads": 28,
17
+ "num_hidden_layers": 48,
18
+ "num_key_value_heads": 4,
19
+ "rms_norm_eps": 1e-06,
20
+ "rope_scaling": null,
21
+ "rope_theta": 1000000.0,
22
+ "sliding_window": null,
23
+ "tie_word_embeddings": false,
24
+ "torch_dtype": "bfloat16",
25
+ "transformers_version": "4.45.2",
26
+ "use_cache": true,
27
+ "use_sliding_window": false,
28
+ "vocab_size": 152064
29
+ }
mergekit_config.yml ADDED
@@ -0,0 +1,21 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ dtype: bfloat16
2
+ merge_method: passthrough
3
+ slices:
4
+ - sources:
5
+   - layer_range: [0, 8]
6
+     model: Qwen/Qwen2.5-Coder-7B-Instruct
7
+ - sources:
8
+   - layer_range: [4, 12]
9
+     model: Qwen/Qwen2.5-Coder-7B-Instruct
10
+ - sources:
11
+   - layer_range: [8, 16]
12
+     model: Qwen/Qwen2.5-Coder-7B-Instruct
13
+ - sources:
14
+   - layer_range: [12, 20]
15
+     model: Qwen/Qwen2.5-Coder-7B-Instruct
16
+ - sources:
17
+   - layer_range: [16, 24]
18
+     model: Qwen/Qwen2.5-Coder-7B-Instruct
19
+ - sources:
20
+   - layer_range: [20, 28]
21
+     model: Qwen/Qwen2.5-Coder-7B-Instruct
merges.txt ADDED
The diff for this file is too large to render. See raw diff
 
model-00001-of-00051.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5aa6e5cbe642377fd441fb4e60e83cca96b2bcd9820e245b9ea06d94653f17f2
3
+ size 1089994880
model-00002-of-00051.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:26cac15f69a0986aa527db661257174afd8c6cc8ccb4e937bdedfaad76775ed4
3
+ size 1089994896
model-00003-of-00051.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3fca0545f38f5c06dfcab0739750941ade6e693cced38a0403bc509e4eb6b400
3
+ size 466124232
model-00004-of-00051.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0247ad966756ae850ea0599f0a56fd5eb9e16d309bc432ac9d8be2e0caa33573
3
+ size 466124240
model-00005-of-00051.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:97806220487297216a97b7e3a6333eb5d0fb6802fcfe336eb703fe8a5ebd8a61
3
+ size 407372152
model-00006-of-00051.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:df655df5f41fd724fc9779042260ed3d5e8bc005409ca6c3a6ca03e64ddd4b5f
3
+ size 491814488
model-00007-of-00051.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c54aa8e1a2ae9990938da66f8513351d4ba2e6f3edcea9b131ca2d0d98ae5aa5
3
+ size 440419456
model-00008-of-00051.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:87f339f486a06afd190e631e04f5b53fd8bf9b29cd9de7524636a65d9dcdfdbe
3
+ size 491814488
model-00009-of-00051.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:515e3f56cf81c17b9578b115b0213d3d9b9f379a3a399108169464f0e67d3869
3
+ size 440419448
model-00010-of-00051.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:406dd666f3ebe2117e92b4b5cd47c4502fab106eea90f69bc878e042a3caa870
3
+ size 491814488
model-00011-of-00051.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3df9d209fb4bac4dae8c0c36b027ddc0b3b279aecb76506cbe425d8dc22c6eb7
3
+ size 440419456
model-00012-of-00051.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8a707f7ad5059e07d7fa38136e1a4875b9f10868a89be8cbb29c91d5fceb0d7a
3
+ size 491814488
model-00013-of-00051.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e83043361f5fed62551294e4ba5f573d4316e8997e44168811d49e3b6e98337a
3
+ size 440419456
model-00014-of-00051.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:074ad51506d6f05f397a33fa0367b17ae5c9138b33b8787b7fef928a376f0b89
3
+ size 491814488
model-00015-of-00051.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cf09f5895ba09ea612e3e592e2139bed3bf0e24bee70f353d66e72336b977a92
3
+ size 440419456
model-00016-of-00051.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e7c50d41b7ad145f712eb0bfa6fdbb85b217dd4d9ce47bc49cede71685f5a429
3
+ size 491814488
model-00017-of-00051.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d0c8ef07ab28b64db222845fc4d32f799dd0e511191403d4860e91fa6f79dc08
3
+ size 440419448
model-00018-of-00051.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:900c060e20f59ae0c627af24906f017e745aeb60616a601da1b91429108bb763
3
+ size 491814488
model-00019-of-00051.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a407a32754ef43e81b46f77ce9b6f990dea55bc9253119049bc2acc34b9fe447
3
+ size 440419456
model-00020-of-00051.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1388307a1d901e60ab02a58d2b946623a2f379d89a8f0d90d9a9dff8ff62e61b
3
+ size 491814488
model-00021-of-00051.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5f1159883528c6f8d6dd623604debc0746c767b4ffe6d17afd477199f4af39f8
3
+ size 440419456
model-00022-of-00051.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e7e43a2f7c9b786f2c8229cd3e134d1c365f05f6c415fc40815d7a46f701ef3a
3
+ size 491814488
model-00023-of-00051.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c4d3bc9675db52ea057e27fc478d994a3365d63185939a65ec2be817dc990605
3
+ size 440419456
model-00024-of-00051.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:263b9a8b58bda9ad994b6198f6fad51c1a0b702d2dfd294b130eeb87fdf0c544
3
+ size 491814488
model-00025-of-00051.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5f280bcb2271d1851684ee6bca82ad10fee6d595334a904c73501a5ca6da9fdb
3
+ size 499164264
model-00026-of-00051.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:78c522bb70719892d9f51d7930266ff185fc4c43bf70f18b72036fa7749aa7bb
3
+ size 407372152
model-00027-of-00051.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d579ed4275943b25e071a0c08e83dada84e0631236aaa6258b4e3ffa7f2557e3
3
+ size 491814488
model-00028-of-00051.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e7e5da34a9a1087170a77aa7438553daeb5a7f96dd91486433b60782e720a123
3
+ size 440419456
model-00029-of-00051.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:edf58eeb0c32210c9f344ed950df2f01274013cb52b9f76d0e4caa45c3ae108c
3
+ size 491814488
model-00030-of-00051.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5fe479305538759d1832cc9826daabd41dc4dffcd8bb414d73606e48fc44e15c
3
+ size 440419456
model-00031-of-00051.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1722ceffb28708d761c6a5b93facc337e545a3611f37df67a974ee408b8a228d
3
+ size 491814488
model-00032-of-00051.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8ddb2d27807107522662a1db18e576baccd31433af6e348f324fc297c18ac418
3
+ size 440419456
model-00033-of-00051.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0560c744962f9d9b8f12bc23f08d074b95cc8bf99bb9cf3fd5c0109bfbb8b613
3
+ size 491814488
model-00034-of-00051.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a4406a27289d026e887ac2722959b4a01d6bf759fb9cce1b260dc916b7ec7449
3
+ size 499156992
model-00035-of-00051.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fdae7538918bae524a8136dd96a2868b9718e649b237f8d89c5e8b0cb9aed461
3
+ size 466116976
model-00036-of-00051.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:36c5c1a6d8281189cf2b3a83d53ce7806d85249dba1fffe0fc2f68b209ffd849
3
+ size 466116976
model-00037-of-00051.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b13da128d53107fab10a65148fb869fb4303c31c35b15a316906efbc55011809
3
+ size 466116968
model-00038-of-00051.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4e06afba170753878b64b3a131977f1289331fd6c5db00414ceacef5625c97ae
3
+ size 466124240
model-00039-of-00051.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3f20c280710e887f050822c27d614da7aa2de01501faa8bfa4585b5a98665551
3
+ size 407372152
model-00040-of-00051.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0fae556b2278a452b0d9e52f21ccda5f3acaeb44ec29dbfe9f2345bd49efc360
3
+ size 491814472
model-00041-of-00051.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9d009865f805749afb0ad5a5b7d3a9f202e686aa13f7d4b9776228374ac2398e
3
+ size 440419448
model-00042-of-00051.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e424561d4580e83e96044c6332a02d839ed4544075dcfd884dfbab4e504a1259
3
+ size 491814472
model-00043-of-00051.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1ae1f81f9c6aa9b671ab45e9e8dfa7cae4249b202ca6ff9d57ddd28f7a5f1de3
3
+ size 440419448
model-00044-of-00051.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c31bb72e57f1dbabdb52b71b935b30850e6f6729c660c515d5515c41ba77d52c
3
+ size 491814480