init
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- config.json +28 -0
- generation_config.json +7 -0
- model-00001-of-00201.safetensors +3 -0
- model-00002-of-00201.safetensors +3 -0
- model-00003-of-00201.safetensors +3 -0
- model-00004-of-00201.safetensors +3 -0
- model-00005-of-00201.safetensors +3 -0
- model-00006-of-00201.safetensors +3 -0
- model-00007-of-00201.safetensors +3 -0
- model-00008-of-00201.safetensors +3 -0
- model-00009-of-00201.safetensors +3 -0
- model-00010-of-00201.safetensors +3 -0
- model-00011-of-00201.safetensors +3 -0
- model-00012-of-00201.safetensors +3 -0
- model-00013-of-00201.safetensors +3 -0
- model-00014-of-00201.safetensors +3 -0
- model-00015-of-00201.safetensors +3 -0
- model-00016-of-00201.safetensors +3 -0
- model-00017-of-00201.safetensors +3 -0
- model-00018-of-00201.safetensors +3 -0
- model-00019-of-00201.safetensors +3 -0
- model-00020-of-00201.safetensors +3 -0
- model-00021-of-00201.safetensors +3 -0
- model-00022-of-00201.safetensors +3 -0
- model-00023-of-00201.safetensors +3 -0
- model-00024-of-00201.safetensors +3 -0
- model-00025-of-00201.safetensors +3 -0
- model-00026-of-00201.safetensors +3 -0
- model-00027-of-00201.safetensors +3 -0
- model-00028-of-00201.safetensors +3 -0
- model-00029-of-00201.safetensors +3 -0
- model-00030-of-00201.safetensors +3 -0
- model-00031-of-00201.safetensors +3 -0
- model-00032-of-00201.safetensors +3 -0
- model-00033-of-00201.safetensors +3 -0
- model-00034-of-00201.safetensors +3 -0
- model-00035-of-00201.safetensors +3 -0
- model-00036-of-00201.safetensors +3 -0
- model-00037-of-00201.safetensors +3 -0
- model-00038-of-00201.safetensors +3 -0
- model-00039-of-00201.safetensors +3 -0
- model-00040-of-00201.safetensors +3 -0
- model-00041-of-00201.safetensors +3 -0
- model-00042-of-00201.safetensors +3 -0
- model-00043-of-00201.safetensors +3 -0
- model-00044-of-00201.safetensors +3 -0
- model-00045-of-00201.safetensors +3 -0
- model-00046-of-00201.safetensors +3 -0
- model-00047-of-00201.safetensors +3 -0
- model-00048-of-00201.safetensors +3 -0
config.json
ADDED
@@ -0,0 +1,28 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_name_or_path": "TinyLlama/TinyLlama-1.1B-intermediate-step-955k-token-2T",
|
3 |
+
"architectures": [
|
4 |
+
"LlamaForCausalLM"
|
5 |
+
],
|
6 |
+
"attention_bias": false,
|
7 |
+
"attention_dropout": 0.0,
|
8 |
+
"bos_token_id": 1,
|
9 |
+
"eos_token_id": 2,
|
10 |
+
"hidden_act": "silu",
|
11 |
+
"hidden_size": 2048,
|
12 |
+
"initializer_range": 0.02,
|
13 |
+
"intermediate_size": 5632,
|
14 |
+
"max_position_embeddings": 2048,
|
15 |
+
"model_type": "llama",
|
16 |
+
"num_attention_heads": 32,
|
17 |
+
"num_hidden_layers": 22,
|
18 |
+
"num_key_value_heads": 4,
|
19 |
+
"pretraining_tp": 1,
|
20 |
+
"rms_norm_eps": 1e-05,
|
21 |
+
"rope_scaling": null,
|
22 |
+
"rope_theta": 10000.0,
|
23 |
+
"tie_word_embeddings": false,
|
24 |
+
"torch_dtype": "float16",
|
25 |
+
"transformers_version": "4.36.0.dev0",
|
26 |
+
"use_cache": true,
|
27 |
+
"vocab_size": 32000
|
28 |
+
}
|
generation_config.json
ADDED
@@ -0,0 +1,7 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"bos_token_id": 1,
|
3 |
+
"eos_token_id": 2,
|
4 |
+
"max_length": 2048,
|
5 |
+
"pad_token_id": 0,
|
6 |
+
"transformers_version": "4.36.0.dev0"
|
7 |
+
}
|
model-00001-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:460b49c839775d9abb2090834b410e6c9cdfefffbb86caa359f4280bd05a8b3e
|
3 |
+
size 131072128
|
model-00002-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:34efda8a91eebdc88a550052d76be96f90d00d4fee586ca2984c577c5892f853
|
3 |
+
size 131072136
|
model-00003-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7df343eb89f6ac3533370a12c913e2dbd6d7584e42bf2f42fd78ad34d82f8c11
|
3 |
+
size 4232
|
model-00004-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:061d770acc2f5da19d02a32f627e33234454a16e50c64323d519743b7e427dea
|
3 |
+
size 23068816
|
model-00005-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e501b9fcf4e673b644ec490120a0e3ae904772d95715e46833a3b1d7e247c3de
|
3 |
+
size 23068816
|
model-00006-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e31205e4c6e13adf18683b47e034ed962a400e2d029ff80106afaae6f2925e4c
|
3 |
+
size 23068816
|
model-00007-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b5cf2cda7a2751716cabf92b0a5f758e5317fad5c988bf9f2e38d3790c2c2f4e
|
3 |
+
size 4248
|
model-00008-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e09246836320791d69ccaa91477b205cf2c62b6345c5ee8ac236d3a10ec806b4
|
3 |
+
size 1048720
|
model-00009-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:379a4803fbe0dc2da0c344c4d11e8bf4e66386368cc9f5879697d9f0cea1b8a5
|
3 |
+
size 8388760
|
model-00010-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9fd4c4e939328474a1fffb7b38cb03da90e413e4013f44ffc450aeeae9b5b4ac
|
3 |
+
size 8388760
|
model-00011-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8415bdd15937a991796cfafcaf929e84a43329a6d4768c3b58013ab157bcaf2b
|
3 |
+
size 1048720
|
model-00012-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d879e42d31eb3ea140ca044624a83160cd12a4e4bf6fa6209fe05594a414e926
|
3 |
+
size 4232
|
model-00013-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c252ed283fc9a99dd1a6598be13938e48d809113805128135f8a0683e33e3f33
|
3 |
+
size 23068816
|
model-00014-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d4c4a6a1755b86fa655be4a74b76597ae3b3184d62cf4f6c656a6ed128308547
|
3 |
+
size 23068816
|
model-00015-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:464373475cd9891ba80623899bfcc509e8a45f15658fe259ce26c925c0193ca1
|
3 |
+
size 23068816
|
model-00016-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d9d2e0581180ac8115be1cfbb15369cd58a536241c4cdce1149bef057bf07289
|
3 |
+
size 4248
|
model-00017-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:22e145c093067784a714afa1e74a64214014f4b26205241578d2ebebfccce818
|
3 |
+
size 1048720
|
model-00018-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6e46d2d546d4ba3f690c40d9518014cb11abfc8e7770eecfe41a64f7192b6e14
|
3 |
+
size 8388760
|
model-00019-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c6cb4604f58b225dc33a0193cea560c36f9c42310a96fb5b53959eeee8823035
|
3 |
+
size 8388760
|
model-00020-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:07a8b0e1e754ce82e9f5e062855b1da23032d81c6d25490cb74c1ed7dbf6d8c8
|
3 |
+
size 1048720
|
model-00021-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d088f8e1a6c0717d1d35895be7a4a22ed4ac6bf29b091d984c7912acf487c244
|
3 |
+
size 4232
|
model-00022-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0c3d47c84048d605eb9117453e5945d0c1fcd88bd091a3f8241a5f94629bc3c9
|
3 |
+
size 23068816
|
model-00023-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:717d9bcadf628a082054c8c6415bfdfd279ae9606e5d167932cbc0352648b66b
|
3 |
+
size 23068816
|
model-00024-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bcbeed37ff77a5ee9d192add17497f816fce79d5506be64cb8475a2e46375f35
|
3 |
+
size 23068816
|
model-00025-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:64d17eaac55e87a54e2e42debe35edcf1e14d9264ffb4b60f20fc4b04589ae85
|
3 |
+
size 4248
|
model-00026-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b783c5ce3ccb97cb1507dbdcf1d5a89e9c8156d36fb6f7f7149637aa6f47cd15
|
3 |
+
size 1048720
|
model-00027-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:573108e9b9313727081d14b29a77a84dff06adc12d7f84829a843047dabe492e
|
3 |
+
size 8388760
|
model-00028-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d053bf7ff20cd5d17268a0341e2805a80008799e989e88b1989c8e6bdf40a35b
|
3 |
+
size 8388760
|
model-00029-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:03d10956eb679c1ef6a6858e40e9b6c8b63954e500df7e61ab8a9d20f9160222
|
3 |
+
size 1048720
|
model-00030-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:192b132566ff966bb9bafd203f2a4021e2312cbf5fdaf7a46490d935e74a6df7
|
3 |
+
size 4232
|
model-00031-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:94bd1cf4b15d77e78de525980de4d55b36736bdd1cfc6996294cba24be28015e
|
3 |
+
size 23068816
|
model-00032-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b112be4a8d15c4c371be80598b1df6f958a904ee0d87619a52e438fa02d0c438
|
3 |
+
size 23068816
|
model-00033-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:92842f701662dd3683f918eae916ab2707381fab0a49c03b9634e772042c3247
|
3 |
+
size 23068816
|
model-00034-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e11adc5d50d21158f097f83cd080727fac00d2f6be1684ca09aa89d0071fb510
|
3 |
+
size 4248
|
model-00035-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:70c21c78a2c6363f619ce88fb96865daa3e21ed4c979907eeb5a8055f7983276
|
3 |
+
size 1048720
|
model-00036-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a79b560b44ca4f243f1d643100b97301f8777820b584e4a13b6fe820bfe6ed9d
|
3 |
+
size 8388760
|
model-00037-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:564a67bb3155bb15fdfad09d834f94ca0abdf75896610ccdca25c43ea3b6af63
|
3 |
+
size 8388760
|
model-00038-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2c59311e54c14f9cb05823f577cc01eed0b689bbb4c193ccecb461f0335d3115
|
3 |
+
size 1048720
|
model-00039-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f5861756ebe28fad7aed09d2a2f86417c48a42fe25b4617a26a5ef175e747679
|
3 |
+
size 4232
|
model-00040-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e47054eb9fccf9de534daf055a637f583ca83c5fec4ecb6723083859ddd5f76e
|
3 |
+
size 23068816
|
model-00041-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7583dd7d88bb6d8616f8b734d0409dde3d5564b25e311795c047b96cd5bd5fd6
|
3 |
+
size 23068816
|
model-00042-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b9d67801717d5c6ac78b9b09f6baba223f2ce076f973d3b4fe79b8c2bbfc213b
|
3 |
+
size 23068816
|
model-00043-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a4223e2c1f938c91cb09beaec0cd1d46208b7e66fa1138ada9418f22fe69cb9a
|
3 |
+
size 4248
|
model-00044-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b8a621291b46c8eee19c55cb47d2f081496fd67ae48c659b8c95be2bfdd3995b
|
3 |
+
size 1048720
|
model-00045-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:77413a82be3eb2e9284d38ceca8393f6493f8989ac9688746cf4fd1868e65a53
|
3 |
+
size 8388760
|
model-00046-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:36af101db4cf2a4e2e206c4a8a77597c6f9e76954ca252d066997932f4051937
|
3 |
+
size 8388760
|
model-00047-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7000ee0d6568145314610c544b626131f3b1bb3b138a3b4afdcfb26d14d24838
|
3 |
+
size 1048720
|
model-00048-of-00201.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:852cfb6a09ba2d10135d1aaf4e611803c61fad4f007416b72ffef9894df6e8db
|
3 |
+
size 4232
|