SanjanaCodes
committed on
Commit
•
48e6e5f
1
Parent(s):
d2a238c
Upload model from local save
Browse files
This view is limited to 50 files because it contains too many changes.
See raw diff
- .gitattributes +1 -0
- config.json +40 -0
- generation_config.json +12 -0
- pytorch_model-00001-of-00162.bin +3 -0
- pytorch_model-00002-of-00162.bin +3 -0
- pytorch_model-00003-of-00162.bin +3 -0
- pytorch_model-00004-of-00162.bin +3 -0
- pytorch_model-00005-of-00162.bin +3 -0
- pytorch_model-00006-of-00162.bin +3 -0
- pytorch_model-00007-of-00162.bin +3 -0
- pytorch_model-00008-of-00162.bin +3 -0
- pytorch_model-00009-of-00162.bin +3 -0
- pytorch_model-00010-of-00162.bin +3 -0
- pytorch_model-00011-of-00162.bin +3 -0
- pytorch_model-00012-of-00162.bin +3 -0
- pytorch_model-00013-of-00162.bin +3 -0
- pytorch_model-00014-of-00162.bin +3 -0
- pytorch_model-00015-of-00162.bin +3 -0
- pytorch_model-00016-of-00162.bin +3 -0
- pytorch_model-00017-of-00162.bin +3 -0
- pytorch_model-00018-of-00162.bin +3 -0
- pytorch_model-00019-of-00162.bin +3 -0
- pytorch_model-00020-of-00162.bin +3 -0
- pytorch_model-00021-of-00162.bin +3 -0
- pytorch_model-00022-of-00162.bin +3 -0
- pytorch_model-00023-of-00162.bin +3 -0
- pytorch_model-00024-of-00162.bin +3 -0
- pytorch_model-00025-of-00162.bin +3 -0
- pytorch_model-00026-of-00162.bin +3 -0
- pytorch_model-00027-of-00162.bin +3 -0
- pytorch_model-00028-of-00162.bin +3 -0
- pytorch_model-00029-of-00162.bin +3 -0
- pytorch_model-00030-of-00162.bin +3 -0
- pytorch_model-00031-of-00162.bin +3 -0
- pytorch_model-00032-of-00162.bin +3 -0
- pytorch_model-00033-of-00162.bin +3 -0
- pytorch_model-00034-of-00162.bin +3 -0
- pytorch_model-00035-of-00162.bin +3 -0
- pytorch_model-00036-of-00162.bin +3 -0
- pytorch_model-00037-of-00162.bin +3 -0
- pytorch_model-00038-of-00162.bin +3 -0
- pytorch_model-00039-of-00162.bin +3 -0
- pytorch_model-00040-of-00162.bin +3 -0
- pytorch_model-00041-of-00162.bin +3 -0
- pytorch_model-00042-of-00162.bin +3 -0
- pytorch_model-00043-of-00162.bin +3 -0
- pytorch_model-00044-of-00162.bin +3 -0
- pytorch_model-00045-of-00162.bin +3 -0
- pytorch_model-00046-of-00162.bin +3 -0
- pytorch_model-00047-of-00162.bin +3 -0
.gitattributes
CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
|
33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
|
|
|
33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
36 |
+
tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
config.json
ADDED
@@ -0,0 +1,40 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_name_or_path": "meta-llama/Llama-3.1-8b-Instruct",
|
3 |
+
"architectures": [
|
4 |
+
"LlamaForCausalLM"
|
5 |
+
],
|
6 |
+
"attention_bias": false,
|
7 |
+
"attention_dropout": 0.0,
|
8 |
+
"bos_token_id": 128000,
|
9 |
+
"eos_token_id": [
|
10 |
+
128001,
|
11 |
+
128008,
|
12 |
+
128009
|
13 |
+
],
|
14 |
+
"head_dim": 128,
|
15 |
+
"hidden_act": "silu",
|
16 |
+
"hidden_size": 4096,
|
17 |
+
"initializer_range": 0.02,
|
18 |
+
"intermediate_size": 14336,
|
19 |
+
"max_position_embeddings": 131072,
|
20 |
+
"mlp_bias": false,
|
21 |
+
"model_type": "llama",
|
22 |
+
"num_attention_heads": 32,
|
23 |
+
"num_hidden_layers": 32,
|
24 |
+
"num_key_value_heads": 8,
|
25 |
+
"pretraining_tp": 1,
|
26 |
+
"rms_norm_eps": 1e-05,
|
27 |
+
"rope_scaling": {
|
28 |
+
"factor": 8.0,
|
29 |
+
"high_freq_factor": 4.0,
|
30 |
+
"low_freq_factor": 1.0,
|
31 |
+
"original_max_position_embeddings": 8192,
|
32 |
+
"rope_type": "llama3"
|
33 |
+
},
|
34 |
+
"rope_theta": 500000.0,
|
35 |
+
"tie_word_embeddings": false,
|
36 |
+
"torch_dtype": "float32",
|
37 |
+
"transformers_version": "4.46.3",
|
38 |
+
"use_cache": true,
|
39 |
+
"vocab_size": 128256
|
40 |
+
}
|
generation_config.json
ADDED
@@ -0,0 +1,12 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"bos_token_id": 128000,
|
3 |
+
"do_sample": true,
|
4 |
+
"eos_token_id": [
|
5 |
+
128001,
|
6 |
+
128008,
|
7 |
+
128009
|
8 |
+
],
|
9 |
+
"temperature": 0.6,
|
10 |
+
"top_p": 0.9,
|
11 |
+
"transformers_version": "4.46.3"
|
12 |
+
}
|
pytorch_model-00001-of-00162.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0b7703b39d8c63695590a75e09e7ed6eed84747c8bfcb87d27fa4baa4e9c96e5
|
3 |
+
size 2101347717
|
pytorch_model-00002-of-00162.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:79a7a729d6178840a6c315fab2c1140a407200552086b0c2babe60b205e14c5e
|
3 |
+
size 83887830
|
pytorch_model-00003-of-00162.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cb85b3c1fb2cb0f5e11418ba1e12b925296c69de6991a471b922df0cf83e8e16
|
3 |
+
size 234882437
|
pytorch_model-00004-of-00162.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5a02508a1f5d4406cd4b2b925bb76cbb41aa961f49dc260190bd2ff800987d10
|
3 |
+
size 234882437
|
pytorch_model-00005-of-00162.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4e77ff35193175e7cbef360e628e9312632ffd25557b39b48c8d0bf6ce6d9e52
|
3 |
+
size 234882437
|
pytorch_model-00006-of-00162.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f941f3fb0a197687f624692089289ba083f661e5ff42cde74be744735f301139
|
3 |
+
size 83921208
|
pytorch_model-00007-of-00162.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:39c892895361a4b21f4c69bddc59ed7cecaa054783e4e7d401d891bc5c5439df
|
3 |
+
size 83887830
|
pytorch_model-00008-of-00162.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b2726ef9e5e7a6c77971c7cb8ce3f4fbbea28b07f67c5bba605249bedd90e5d5
|
3 |
+
size 234882437
|
pytorch_model-00009-of-00162.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c47c51e8d56fda10842e78b436135acfcbbaee66b4278ad665e8694e4647b191
|
3 |
+
size 234882437
|
pytorch_model-00010-of-00162.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c89edbe75f6b591631f2d248e88557e273bf6abd9bafbda0c5f422bbedb4e120
|
3 |
+
size 234882437
|
pytorch_model-00011-of-00162.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0b16792be49ea16395a27a15bc6469b84819bbf41bb747b528378d318759b634
|
3 |
+
size 83921208
|
pytorch_model-00012-of-00162.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7cdeeb095cee34aa1d110eb9f2d40364b3c8c78a5a7a3b50a4115dafc3165041
|
3 |
+
size 83887830
|
pytorch_model-00013-of-00162.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4b2d16c4ec6f43fa5308cef525782ff8cc6f65b7bc38ec163cfaa673c2251fd5
|
3 |
+
size 234882437
|
pytorch_model-00014-of-00162.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:400c898992281632bba19f172b9fd15e6ae1a4f9b7211d7006f13b783876acb0
|
3 |
+
size 234882437
|
pytorch_model-00015-of-00162.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:72c037527babd9a2737cf1ad4642b7bece1edb5c9e7f02fb87b21e1c92cbc816
|
3 |
+
size 234882437
|
pytorch_model-00016-of-00162.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:66adb78584cb4c769bb889cfcc581a0e49f973135ae08a212db9f828f04f9ada
|
3 |
+
size 83921208
|
pytorch_model-00017-of-00162.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:065ea6c35a593c92eb80d8617a6b9d4dc1d0f262efe8a8a4e9e87a80af7213cb
|
3 |
+
size 83887830
|
pytorch_model-00018-of-00162.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b1f3049d233bbef4933e1f152e60b175569e21ae8fb30bb12720fa22583f1477
|
3 |
+
size 234882437
|
pytorch_model-00019-of-00162.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5fe27774ce627fe60e50848741dc75a2c89bf6579fbe0a695657e40dcfd07375
|
3 |
+
size 234882437
|
pytorch_model-00020-of-00162.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:82597344d832961811925a0c8d333fae479d3060631844c3b184810cab041cd5
|
3 |
+
size 234882437
|
pytorch_model-00021-of-00162.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6c62e59e090238f77e2eda60aea84691d8c26d74c1c9fe835aed21d2f2c0b20c
|
3 |
+
size 83921208
|
pytorch_model-00022-of-00162.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:71e11ad6c9e415487e216151ac01f26cf387bb678777938aa5d03b9cb5e4d94e
|
3 |
+
size 83887830
|
pytorch_model-00023-of-00162.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:04ae562f3fb74d7a3b6e944383d48546988eb65ea3fdd53021b5ca2a34704e2e
|
3 |
+
size 234882437
|
pytorch_model-00024-of-00162.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:410846dae4753013ced8ff387947d7cdafca872489064f19bd5be44177e58d17
|
3 |
+
size 234882437
|
pytorch_model-00025-of-00162.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d80f0df46ea112386173d5110547be96b00b336bf2416f20546a17746dc71b40
|
3 |
+
size 234882437
|
pytorch_model-00026-of-00162.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:89845ef68175bf631588ca47830de952cfa1d7599b521b92d3c7a8c691b0a9bb
|
3 |
+
size 83921208
|
pytorch_model-00027-of-00162.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2c9b2d2fc10e7eb1f7d5cc62612d95af4ec9ea12dd5cb9de2385184f764d2236
|
3 |
+
size 83887830
|
pytorch_model-00028-of-00162.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ab466e8483140c1fd401f0eb22bee758c327ab0b41afac5e7d5a61379197b24c
|
3 |
+
size 234882437
|
pytorch_model-00029-of-00162.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9a1ecb314a44ef6a3c3ebc35e829ee055988cf193ad5fdb73130751282a7fd1a
|
3 |
+
size 234882437
|
pytorch_model-00030-of-00162.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0fcf37c48bec630a21a0ac09753cf0342f9286beb1f3b353fd4248158c89f017
|
3 |
+
size 234882437
|
pytorch_model-00031-of-00162.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:25c16aa187a0d9ae1614d832fa168d0197391cb943df29148aa0dabd88bea239
|
3 |
+
size 83921208
|
pytorch_model-00032-of-00162.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3124672d7fb279a41dd4606403e0c1dce6b1b53a6eb81392591433968010ef70
|
3 |
+
size 83887830
|
pytorch_model-00033-of-00162.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:26133d9a86756b4cf05ddb92451b77f6a12291524942aec7e3aa1c18a7d68f29
|
3 |
+
size 234882437
|
pytorch_model-00034-of-00162.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:872b65f4ac60e10f7b73613efac67a5da792f9c53ad051e0f14fb76b90e5a582
|
3 |
+
size 234882437
|
pytorch_model-00035-of-00162.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:eda50d9e0c4b01120db8640aa5d201bc5cdcfc57a2bde233fae80c564c40b4b5
|
3 |
+
size 234882437
|
pytorch_model-00036-of-00162.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ae6814b9d449c91feb7a1f872fcfd5de617687ff95b66c2d6aa039560ea17860
|
3 |
+
size 83921208
|
pytorch_model-00037-of-00162.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4db6f520cd58f0bf171cb396312ed5b8cf0d5731a00e3b0a25747c3572787cd5
|
3 |
+
size 83887830
|
pytorch_model-00038-of-00162.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:922dfcecbbe79c3cd7846bbbfe6838422402148ce798db479fb04e28c4ec9ab8
|
3 |
+
size 234882437
|
pytorch_model-00039-of-00162.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:403c4e059bf21ce6fb89c470d2643a79f230728d99fb7c39afc77a2fb83cf416
|
3 |
+
size 234882437
|
pytorch_model-00040-of-00162.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:60dadf2e3fe49870a27c983dc55edfeefa91bcdb81a15a52723d680f74bed1c2
|
3 |
+
size 234882437
|
pytorch_model-00041-of-00162.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1161581a2dbcc334d79a8b9e650c1363880d603c83e502fd72fd0367405e9084
|
3 |
+
size 83921208
|
pytorch_model-00042-of-00162.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7b2c58b10c8ec1ec62dbd72a4fc80cba07a55816c37b2cd4a1eb295209025d03
|
3 |
+
size 83887830
|
pytorch_model-00043-of-00162.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bcb675efac85ca8271c5684b59b8e73289e3f2d5797a9248810fbc6bcc52ebbc
|
3 |
+
size 234882437
|
pytorch_model-00044-of-00162.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:509008f3eef60e5f2764b1dbbafcd335ced9578d54b2275f2863b75e009187c3
|
3 |
+
size 234882437
|
pytorch_model-00045-of-00162.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c9f2b472bfdb63cdce85fc68a481cf82f70670a764db75ca9310fa0a5b7778bf
|
3 |
+
size 234882437
|
pytorch_model-00046-of-00162.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:75acd66e6d83d740406df674efb1d7936cb1dc46a33684217e1085aeda83244f
|
3 |
+
size 83921208
|
pytorch_model-00047-of-00162.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ad54a0c92ac4914b23990eb4415026e4ab936ee53e3377330a5120e5d391820b
|
3 |
+
size 83887830
|