abhishek3jangid
committed on
Commit
•
1df732f
1
Parent(s):
5faf92d
Initial upload
Browse files
This view is limited to 50 files because it contains too many changes.
See raw diff
- config.json +40 -0
- generation_config.json +12 -0
- model-00001-of-00062.safetensors +3 -0
- model-00002-of-00062.safetensors +3 -0
- model-00003-of-00062.safetensors +3 -0
- model-00004-of-00062.safetensors +3 -0
- model-00005-of-00062.safetensors +3 -0
- model-00006-of-00062.safetensors +3 -0
- model-00007-of-00062.safetensors +3 -0
- model-00008-of-00062.safetensors +3 -0
- model-00009-of-00062.safetensors +3 -0
- model-00010-of-00062.safetensors +3 -0
- model-00011-of-00062.safetensors +3 -0
- model-00012-of-00062.safetensors +3 -0
- model-00013-of-00062.safetensors +3 -0
- model-00014-of-00062.safetensors +3 -0
- model-00015-of-00062.safetensors +3 -0
- model-00016-of-00062.safetensors +3 -0
- model-00017-of-00062.safetensors +3 -0
- model-00018-of-00062.safetensors +3 -0
- model-00019-of-00062.safetensors +3 -0
- model-00020-of-00062.safetensors +3 -0
- model-00021-of-00062.safetensors +3 -0
- model-00022-of-00062.safetensors +3 -0
- model-00023-of-00062.safetensors +3 -0
- model-00024-of-00062.safetensors +3 -0
- model-00025-of-00062.safetensors +3 -0
- model-00026-of-00062.safetensors +3 -0
- model-00027-of-00062.safetensors +3 -0
- model-00028-of-00062.safetensors +3 -0
- model-00029-of-00062.safetensors +3 -0
- model-00030-of-00062.safetensors +3 -0
- model-00031-of-00062.safetensors +3 -0
- model-00032-of-00062.safetensors +3 -0
- model-00033-of-00062.safetensors +3 -0
- model-00034-of-00062.safetensors +3 -0
- model-00035-of-00062.safetensors +3 -0
- model-00036-of-00062.safetensors +3 -0
- model-00037-of-00062.safetensors +3 -0
- model-00038-of-00062.safetensors +3 -0
- model-00039-of-00062.safetensors +3 -0
- model-00040-of-00062.safetensors +3 -0
- model-00041-of-00062.safetensors +3 -0
- model-00042-of-00062.safetensors +3 -0
- model-00043-of-00062.safetensors +3 -0
- model-00044-of-00062.safetensors +3 -0
- model-00045-of-00062.safetensors +3 -0
- model-00046-of-00062.safetensors +3 -0
- model-00047-of-00062.safetensors +3 -0
- model-00048-of-00062.safetensors +3 -0
config.json
ADDED
@@ -0,0 +1,40 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_name_or_path": "meta-llama/Llama-3.1-70B-Instruct",
|
3 |
+
"architectures": [
|
4 |
+
"LlamaForCausalLM"
|
5 |
+
],
|
6 |
+
"attention_bias": false,
|
7 |
+
"attention_dropout": 0.0,
|
8 |
+
"bos_token_id": 128000,
|
9 |
+
"eos_token_id": [
|
10 |
+
128001,
|
11 |
+
128008,
|
12 |
+
128009
|
13 |
+
],
|
14 |
+
"head_dim": 128,
|
15 |
+
"hidden_act": "silu",
|
16 |
+
"hidden_size": 8192,
|
17 |
+
"initializer_range": 0.02,
|
18 |
+
"intermediate_size": 28672,
|
19 |
+
"max_position_embeddings": 131072,
|
20 |
+
"mlp_bias": false,
|
21 |
+
"model_type": "llama",
|
22 |
+
"num_attention_heads": 64,
|
23 |
+
"num_hidden_layers": 80,
|
24 |
+
"num_key_value_heads": 8,
|
25 |
+
"pretraining_tp": 1,
|
26 |
+
"rms_norm_eps": 1e-05,
|
27 |
+
"rope_scaling": {
|
28 |
+
"factor": 8.0,
|
29 |
+
"high_freq_factor": 4.0,
|
30 |
+
"low_freq_factor": 1.0,
|
31 |
+
"original_max_position_embeddings": 8192,
|
32 |
+
"rope_type": "llama3"
|
33 |
+
},
|
34 |
+
"rope_theta": 500000.0,
|
35 |
+
"tie_word_embeddings": false,
|
36 |
+
"torch_dtype": "float32",
|
37 |
+
"transformers_version": "4.46.3",
|
38 |
+
"use_cache": false,
|
39 |
+
"vocab_size": 128256
|
40 |
+
}
|
generation_config.json
ADDED
@@ -0,0 +1,12 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"bos_token_id": 128000,
|
3 |
+
"do_sample": true,
|
4 |
+
"eos_token_id": [
|
5 |
+
128001,
|
6 |
+
128008,
|
7 |
+
128009
|
8 |
+
],
|
9 |
+
"temperature": 0.6,
|
10 |
+
"top_p": 0.9,
|
11 |
+
"transformers_version": "4.46.3"
|
12 |
+
}
|
model-00001-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:995918030d8ff5acbd5cdde18276596d0afaf5c68369bcab7aa1f44fb65be2c2
|
3 |
+
size 4806672984
|
model-00002-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4d9da25bd05ffcd9f66a161233f75b85329491d34458ef9c3473c2991fcf4968
|
3 |
+
size 4362142864
|
model-00003-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:98abb2a303ea166336690957ad5dcd0bcfbd28d322834c67cef15ee2167ac32a
|
3 |
+
size 4362142864
|
model-00004-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:119c68bd67289c53f70fedda23195fd10792f23e2983237020de9f1907638206
|
3 |
+
size 4966188864
|
model-00005-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1ae41491e31f3039bba9544b1ae83a6927b39bc4608bbd7a304d96fb9e12d8d4
|
3 |
+
size 4362142864
|
model-00006-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a62f91122a6351b638cf8062d91a9d65f88a7c1ab6ef4a7589e8ab1fc4631796
|
3 |
+
size 4362142864
|
model-00007-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a0af954666c818986f8c467de08d4cf62e5bd9b9b85b57e04288e40208d7c573
|
3 |
+
size 4966188864
|
model-00008-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a5de6f61bd5e105a9247caf036b566a72a7f1e7de7c286efb84d0e52cf536fc7
|
3 |
+
size 4362142864
|
model-00009-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:105098a40517be8a19f2690c1803eeb7558d29a26636170641b164610ee84d94
|
3 |
+
size 4362142880
|
model-00010-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:69a7b7f70950a501c61fbb3d707140ebc11a498f60232757ef351792366b05b5
|
3 |
+
size 4966188880
|
model-00011-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6faf10394af7a5fa1b06f14285bda7772ccbcabd9a2913ba7c9187dccfdeae29
|
3 |
+
size 4362142872
|
model-00012-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5332ca9241f2be64e8cf02d066ae0a39328d9b0ed9e0ccb4d8a81f2a9e9e75a0
|
3 |
+
size 4362142872
|
model-00013-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e6900e7eb8acd45360efca8536f21835b4098e79a16eef01ed90f3aa2eb569c0
|
3 |
+
size 4966188880
|
model-00014-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:523b8a098bc5d92d33c77404813b22fcae38dc4c3cc694487643b06437425510
|
3 |
+
size 4362142872
|
model-00015-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cb27241aa3ac8a1271096064f37fa872777b68e39be30e1f3dfdecad63564c20
|
3 |
+
size 4362142872
|
model-00016-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:54b1f61de35e62ee4b38ab2032fc0c950ebb60fa1d52a96ecd63fad0940fd5ee
|
3 |
+
size 4966188880
|
model-00017-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:abadee78a10b8ff56c0c7c4843c8f4d6662a108e2ebbd7bd2b9e3056acec5962
|
3 |
+
size 4362142872
|
model-00018-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:33cbc431d69aa3557d5ae26d2910f02ecb0ae59449fafb891f6a4cf7e14418fd
|
3 |
+
size 4362142872
|
model-00019-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:090d0ece08a734122f48769e1e6b57a2ff65f181decca05f1b6c47b94d8f702d
|
3 |
+
size 4966188880
|
model-00020-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:68952eb6da619cff07e6c2a0ea2cfb9e0fe6a475a623c679cdfe20fc5c1651d3
|
3 |
+
size 4362142872
|
model-00021-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a3bcf49cc7b5c3840c7108cc0f2ec433cd168b2ebc95d444f8d7d38efc817dc8
|
3 |
+
size 4362142872
|
model-00022-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ae1fdd2d31e643b1484eb8d32dc85a68c1460c2caf2ed47c94ff190df2f0f212
|
3 |
+
size 4966188880
|
model-00023-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:80b006c71886fa988b121d6d929721b13db9ff08e2f91f90989633d4dae8b0e7
|
3 |
+
size 4362142872
|
model-00024-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:206b24d72de979d306c4c2d93bdb509a6360f16306617b445552bfe01c3d4dc6
|
3 |
+
size 4362142872
|
model-00025-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:40f561af8b9c94202c3b19f44b50c49b0b436ccb7a90e3f5feff336422734f0a
|
3 |
+
size 4966188880
|
model-00026-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4977dd0840419f59866da90d0d750d0d7477765d31b22f49608775e5f50c99a2
|
3 |
+
size 4362142872
|
model-00027-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ba565b707250ddcf259d1470bb8f3e640fa2d6bbb25249b85f5adbc6a9ae04db
|
3 |
+
size 4362142872
|
model-00028-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:02f34ce2f014323aae237610e3c40d737e10a291f96959e4a4447a8d12f3f2d1
|
3 |
+
size 4966188880
|
model-00029-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:67bc2ba40596e7a0b076b5ef8a111271367ac10ba18b17b5b66e5471475ce5d2
|
3 |
+
size 4362142872
|
model-00030-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d8488e31c285781984e5aafe41a22f27348e150405f7547fca2c787e08367914
|
3 |
+
size 4362142872
|
model-00031-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:662f0cec6350aeb946d3e9a6daa88c6f242957635e8b9d1ac3c6de277a9047e0
|
3 |
+
size 4966188880
|
model-00032-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:adb6792dbd8926f36cf212f49fb084e33f55028f1004aa681816ae819ddcbb76
|
3 |
+
size 4362142872
|
model-00033-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:218e0baeadad523f14998924284904f10f345ff59fddfe3dbfb3b4b798969863
|
3 |
+
size 4362142872
|
model-00034-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:54ea946d7e740dfee1fc8df00bbbdf258af73f58ad718d26b40904b8918bfb07
|
3 |
+
size 4966188880
|
model-00035-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:24ca7069c950b14633a9da8ca5f5c6dbb3c67707926448fe8916487d37e5ab52
|
3 |
+
size 4362142872
|
model-00036-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7e0fa4a6af0e6ad2f255da2f0f067841a15513e434b5db93abc3c20aa3334115
|
3 |
+
size 4362142872
|
model-00037-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:30ac564d204258ab9694c3ca708eea5fdb21e8c4b9e7f7cc6889c84834aa4329
|
3 |
+
size 4966188880
|
model-00038-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5748206318a01b01487712e5628597aaa4be642638a651df703c68b9e98bb7bc
|
3 |
+
size 4362142872
|
model-00039-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d3388a4fcc4403325368d833fa282728249c211ac9724437be24a92b1be6b0bf
|
3 |
+
size 4362142872
|
model-00040-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:37b9d2c5812a727c989b8ada4d7e75380c3de2e15d55f27823b8ed630bd583d5
|
3 |
+
size 4966188880
|
model-00041-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:85dacb7b96033d84ba33862ec933ce6e421477ec15915761cfd539304c5e1aed
|
3 |
+
size 4362142872
|
model-00042-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ab99e9c9f66976f7495a3d3a68705b0d5f8a4cf041664c7b46c92fe9c8c345ed
|
3 |
+
size 4362142872
|
model-00043-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fe46cb9081d00335e7aa427b9121919c00bc9d835ccb535b32b8a47115c713d1
|
3 |
+
size 4966188880
|
model-00044-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3c761cb2d5540c9332b6e1fbfeada54882794117d96ed4ae5b768546bce234a4
|
3 |
+
size 4362142872
|
model-00045-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1d56b0a8a6e5a1d8a921b5de090744b400fd2d7d386a56617467b632283a53fd
|
3 |
+
size 4362142872
|
model-00046-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0fc94b9a43bf7a24fc4e31181dd4f087260767e88a3f6ab5534385cfd084c8b9
|
3 |
+
size 4966188880
|
model-00047-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c8681f5d0b98c710b62ade04956a10b701c5c39f84f2e58f9ae4aa739557e009
|
3 |
+
size 4362142872
|
model-00048-of-00062.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8f83074672531e50b8bcb97c85ee93fa5ac0c40795ccc4901435c324cfcec22a
|
3 |
+
size 4362142872
|