nisten committed on
Commit
5d79425
1 Parent(s): 753bbe3

Upload folder using huggingface_hub

Browse files
Files changed (43) hide show
  1. README.md +52 -1
  2. config.json +28 -0
  3. mergekit_config.yml +28 -0
  4. model-00001-of-00035.safetensors +3 -0
  5. model-00002-of-00035.safetensors +3 -0
  6. model-00003-of-00035.safetensors +3 -0
  7. model-00004-of-00035.safetensors +3 -0
  8. model-00005-of-00035.safetensors +3 -0
  9. model-00006-of-00035.safetensors +3 -0
  10. model-00007-of-00035.safetensors +3 -0
  11. model-00008-of-00035.safetensors +3 -0
  12. model-00009-of-00035.safetensors +3 -0
  13. model-00010-of-00035.safetensors +3 -0
  14. model-00011-of-00035.safetensors +3 -0
  15. model-00012-of-00035.safetensors +3 -0
  16. model-00013-of-00035.safetensors +3 -0
  17. model-00014-of-00035.safetensors +3 -0
  18. model-00015-of-00035.safetensors +3 -0
  19. model-00016-of-00035.safetensors +3 -0
  20. model-00017-of-00035.safetensors +3 -0
  21. model-00018-of-00035.safetensors +3 -0
  22. model-00019-of-00035.safetensors +3 -0
  23. model-00020-of-00035.safetensors +3 -0
  24. model-00021-of-00035.safetensors +3 -0
  25. model-00022-of-00035.safetensors +3 -0
  26. model-00023-of-00035.safetensors +3 -0
  27. model-00024-of-00035.safetensors +3 -0
  28. model-00025-of-00035.safetensors +3 -0
  29. model-00026-of-00035.safetensors +3 -0
  30. model-00027-of-00035.safetensors +3 -0
  31. model-00028-of-00035.safetensors +3 -0
  32. model-00029-of-00035.safetensors +3 -0
  33. model-00030-of-00035.safetensors +3 -0
  34. model-00031-of-00035.safetensors +3 -0
  35. model-00032-of-00035.safetensors +3 -0
  36. model-00033-of-00035.safetensors +3 -0
  37. model-00034-of-00035.safetensors +3 -0
  38. model-00035-of-00035.safetensors +3 -0
  39. model.safetensors.index.json +0 -0
  40. special_tokens_map.json +23 -0
  41. tokenizer.json +0 -0
  42. tokenizer.model +3 -0
  43. tokenizer_config.json +41 -0
README.md CHANGED
@@ -1,3 +1,54 @@
1
  ---
2
- license: mit
 
 
 
 
3
  ---
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
  ---
2
+ base_model: []
3
+ tags:
4
+ - mergekit
5
+ - merge
6
+
7
  ---
8
+ # BigCodeLlama LFG 🚀
9
+
10
+ ## Experimental CodeLlama Frankenstein merge to see how it benchmarks
11
+
12
+ ### Models Merged
13
+
14
+ The following models were included in the merge:
15
+ * ../CodeLlama-70b-hf
16
+ * ../CodeLlama-70b-Instruct-hf
17
+ * ../CodeLlama-70b-Python-hf
18
+
19
+ ### Configuration
20
+
21
+ The following YAML configuration was used to produce this model:
22
+
23
+ ```yaml
24
+ dtype: bfloat16
25
+ merge_method: passthrough
26
+ slices:
27
+ - sources:
28
+ - layer_range: [0, 69]
29
+ model:
30
+ model:
31
+ path: ../CodeLlama-70b-hf
32
+ - sources:
33
+ - layer_range: [66, 76]
34
+ model:
35
+ model:
36
+ path: ../CodeLlama-70b-Instruct-hf
37
+ - sources:
38
+ - layer_range: [42, 66]
39
+ model:
40
+ model:
41
+ path: ../CodeLlama-70b-hf
42
+ - sources:
43
+ - layer_range: [13, 37]
44
+ model:
45
+ model:
46
+ path: ../CodeLlama-70b-Python-hf
47
+ - sources:
48
+ - layer_range: [10, 80]
49
+ model:
50
+ model:
51
+ path: ../CodeLlama-70b-Instruct-hf
52
+ ```
53
+
54
+ ### Stay tuned for GGUF quants
config.json ADDED
@@ -0,0 +1,28 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "BigCodeLlama-169b",
3
+ "architectures": [
4
+ "LlamaForCausalLM"
5
+ ],
6
+ "attention_bias": false,
7
+ "attention_dropout": 0.0,
8
+ "bos_token_id": 1,
9
+ "eos_token_id": 2,
10
+ "hidden_act": "silu",
11
+ "hidden_size": 8192,
12
+ "initializer_range": 0.02,
13
+ "intermediate_size": 28672,
14
+ "max_position_embeddings": 16384,
15
+ "model_type": "llama",
16
+ "num_attention_heads": 64,
17
+ "num_hidden_layers": 197,
18
+ "num_key_value_heads": 8,
19
+ "pretraining_tp": 1,
20
+ "rms_norm_eps": 1e-05,
21
+ "rope_scaling": null,
22
+ "rope_theta": 1000000,
23
+ "tie_word_embeddings": false,
24
+ "torch_dtype": "bfloat16",
25
+ "transformers_version": "4.37.2",
26
+ "use_cache": true,
27
+ "vocab_size": 32016
28
+ }
mergekit_config.yml ADDED
@@ -0,0 +1,28 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ dtype: bfloat16
2
+ merge_method: passthrough
3
+ slices:
4
+ - sources:
5
+ - layer_range: [0, 69]
6
+ model:
7
+ model:
8
+ path: ../CodeLlama-70b-hf
9
+ - sources:
10
+ - layer_range: [66, 76]
11
+ model:
12
+ model:
13
+ path: ../CodeLlama-70b-Instruct-hf
14
+ - sources:
15
+ - layer_range: [42, 66]
16
+ model:
17
+ model:
18
+ path: ../CodeLlama-70b-hf
19
+ - sources:
20
+ - layer_range: [13, 37]
21
+ model:
22
+ model:
23
+ path: ../CodeLlama-70b-Python-hf
24
+ - sources:
25
+ - layer_range: [10, 80]
26
+ model:
27
+ model:
28
+ path: ../CodeLlama-70b-Instruct-hf
model-00001-of-00035.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e2cdf6d49de5bd6cf36ac2ba1934691b637578e15a2545e7303bbd85bf811abb
3
+ size 9852869216
model-00002-of-00035.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:da3cfed04534b57517a985ad7562817357e189df6bc4aa78154db5c8fdcb0ffb
3
+ size 9798096232
model-00003-of-00035.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c0428161bd48d61d51eb3316e3758059f57fbe963670260dc1e590498152e481
3
+ size 9797997992
model-00004-of-00035.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ca65b7cba5706dc35657650ffa552696493e210fcb94afba110474d240a4d34d
3
+ size 9630325192
model-00005-of-00035.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8d9e1443b8809374e42982b52ddeee2a39db9d500df41961d6b737fe0f087222
3
+ size 9798096992
model-00006-of-00035.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:05425f4c273c3c9e51e40315999d6136a49b1038ea8b4b1a83ff2516f3b8b8d7
3
+ size 9798129992
model-00007-of-00035.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:491f90efbb9c435ea88c7d8e106fe70697a507b8db8406fa6fb3ec40f977e95a
3
+ size 9999423488
model-00008-of-00035.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cdc12500041f01ffd1729b9a8b1fa8fb1dd12773ee26bc304308ce4075060bb0
3
+ size 9965868792
model-00009-of-00035.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:102e1e2ab7e9beae5ad08f6ec0b3a7809e393bafcd3125ddd5dfdaba9f492c72
3
+ size 9932314128
model-00010-of-00035.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9bec2242b2b0e5d9945c0518af30e2e1bbd2c84dddd602d95b60e50a94fa6a46
3
+ size 9798031016
model-00011-of-00035.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:22d8d0760bd7f9ae65d6cc1de2108674517466ffb3735777db214fc0bd6806eb
3
+ size 9965853000
model-00012-of-00035.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9f5ee6252ebebbb96df56ac025693a135c7d0c6b59ca59935aebe67a6d67e06a
3
+ size 9764559544
model-00013-of-00035.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fb3aecb0bd849f22aabdd5a360d7fb6d228fcf143ecf5e7b0278b8bc709f0237
3
+ size 9798097000
model-00014-of-00035.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1e457102fc56a72492b9e7c8e49f51576108cd4f0326e2a8e8adf08ba8467261
3
+ size 9999423480
model-00015-of-00035.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:128a39f880167a165c9c5f24ee7eddc6199f3f7b8fba46d6a7eb857b730176d1
3
+ size 9831650944
model-00016-of-00035.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:966a1dcb03fd6e2739c9c659f1519126885fdf84d2692602a7e7b9fefdba869a
3
+ size 9764541608
model-00017-of-00035.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2951108e876924b3543d65eebf6a43a64a3763135e6085712aba4b12d9c8b777
3
+ size 9965819992
model-00018-of-00035.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e01ef782efcd49e1af01bb7d5863613e1094d19528826572758da92898aaa10f
3
+ size 9932282544
model-00019-of-00035.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8b24adb40483a2afd6f9a1a375a876db31e83cb1d52ea20fb8bd96574f39f0d6
3
+ size 9764576040
model-00020-of-00035.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:874d4940d68b908eeda96cf4e943820ad05e203277033387ba2f5692c49a820a
3
+ size 9831667424
model-00021-of-00035.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:df0e31413836df6eac4870b068bfd4f51da77339e76ce2cfa43b73260105d409
3
+ size 9999439952
model-00022-of-00035.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:af7a106c8f195178d507482327840dd70f290f480d52a75961c836453fe4e733
3
+ size 9798063280
model-00023-of-00035.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:46fc216f7e14908bb68489e5c16e1a1ac8a7c294756d3a0c338c449f53fb10d0
3
+ size 9932297608
model-00024-of-00035.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3fb607ff7fbe20f2324299526cba7cd5f1fab8b28478b2ff30b4cddda9db66d6
3
+ size 9630275672
model-00025-of-00035.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b1bba5bac077377d6334041d476584d8a835435231790ddcfb13f07c21371313
3
+ size 9630292184
model-00026-of-00035.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:93562879bb415f590dddbd357d81039d2e3e930478cde61fe9cded9c7a38f91d
3
+ size 9965885288
model-00027-of-00035.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:73cc2507af8fdbba4876ad913daa67164bf23e2ad4d9fca912745d9f706d4507
3
+ size 9798113472
model-00028-of-00035.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4118e6ea30d4a291d8e978ae6b7fcf27c5bb25bf81e33eec7514d54c5be8ceac
3
+ size 9999424168
model-00029-of-00035.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cef6efb8985818333ae7413a911ac5594b3efa72ae4eb98d8a82e51417b4e0ec
3
+ size 9663894912
model-00030-of-00035.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a546055b84316bdf244c9028e508669314474e24f06775225ad4cc12a829cb16
3
+ size 9764541608
model-00031-of-00035.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dbcde9f1e93113e13923c8c87357d9fcf6788bba40e2eae1b13c9c2ccaf2df0e
3
+ size 9798014496
model-00032-of-00035.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:33a2e5705ed2099ee4d6c52808426ef36b5fc2581b5bfa5622e404aded4d9cf2
3
+ size 9932315528
model-00033-of-00035.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2368514495d6f9d515252154f3ef8a081221ee8b6a43d37226b06b52a7b0ffc5
3
+ size 9798096992
model-00034-of-00035.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:db982aa39b1ca6576bbf567411746bb8b05119f7f3e224f1d19d469d04dabd16
3
+ size 9697465384
model-00035-of-00035.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:150e94c99a3376ee807539545b5917f402b1085598aee299f76e9b82332f4f30
3
+ size 3779413944
model.safetensors.index.json ADDED
The diff for this file is too large to render. See raw diff
 
special_tokens_map.json ADDED
@@ -0,0 +1,23 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "bos_token": {
3
+ "content": "<s>",
4
+ "lstrip": false,
5
+ "normalized": false,
6
+ "rstrip": false,
7
+ "single_word": false
8
+ },
9
+ "eos_token": {
10
+ "content": "</s>",
11
+ "lstrip": false,
12
+ "normalized": false,
13
+ "rstrip": false,
14
+ "single_word": false
15
+ },
16
+ "unk_token": {
17
+ "content": "<unk>",
18
+ "lstrip": false,
19
+ "normalized": false,
20
+ "rstrip": false,
21
+ "single_word": false
22
+ }
23
+ }
tokenizer.json ADDED
The diff for this file is too large to render. See raw diff
 
tokenizer.model ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:99049b351301fb75b3b0587a484b675cbfd51abe27d2b92eabd385e4c41f97e9
3
+ size 500033
tokenizer_config.json ADDED
@@ -0,0 +1,41 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "add_bos_token": true,
3
+ "add_eos_token": false,
4
+ "added_tokens_decoder": {
5
+ "0": {
6
+ "content": "<unk>",
7
+ "lstrip": false,
8
+ "normalized": false,
9
+ "rstrip": false,
10
+ "single_word": false,
11
+ "special": true
12
+ },
13
+ "1": {
14
+ "content": "<s>",
15
+ "lstrip": false,
16
+ "normalized": false,
17
+ "rstrip": false,
18
+ "single_word": false,
19
+ "special": true
20
+ },
21
+ "2": {
22
+ "content": "</s>",
23
+ "lstrip": false,
24
+ "normalized": false,
25
+ "rstrip": false,
26
+ "single_word": false,
27
+ "special": true
28
+ }
29
+ },
30
+ "bos_token": "<s>",
31
+ "clean_up_tokenization_spaces": false,
32
+ "eos_token": "</s>",
33
+ "legacy": true,
34
+ "model_max_length": 1000000000000000019884624838656,
35
+ "pad_token": null,
36
+ "sp_model_kwargs": {},
37
+ "spaces_between_special_tokens": false,
38
+ "tokenizer_class": "LlamaTokenizer",
39
+ "unk_token": "<unk>",
40
+ "use_default_system_prompt": false
41
+ }