Lyaaaaaaaaaaaaaaa committed on
Commit
57f5ca4
1 Parent(s): 6c25415

Upload 75 files

Browse files
This view is limited to 50 files because it contains too many changes. See raw diff
Files changed (50) hide show
  1. config.json +82 -0
  2. generation_config.json +6 -0
  3. merges.txt +0 -0
  4. pytorch_model-00001-of-00067.bin +3 -0
  5. pytorch_model-00002-of-00067.bin +3 -0
  6. pytorch_model-00003-of-00067.bin +3 -0
  7. pytorch_model-00004-of-00067.bin +3 -0
  8. pytorch_model-00005-of-00067.bin +3 -0
  9. pytorch_model-00006-of-00067.bin +3 -0
  10. pytorch_model-00007-of-00067.bin +3 -0
  11. pytorch_model-00008-of-00067.bin +3 -0
  12. pytorch_model-00009-of-00067.bin +3 -0
  13. pytorch_model-00010-of-00067.bin +3 -0
  14. pytorch_model-00011-of-00067.bin +3 -0
  15. pytorch_model-00012-of-00067.bin +3 -0
  16. pytorch_model-00013-of-00067.bin +3 -0
  17. pytorch_model-00014-of-00067.bin +3 -0
  18. pytorch_model-00015-of-00067.bin +3 -0
  19. pytorch_model-00016-of-00067.bin +3 -0
  20. pytorch_model-00017-of-00067.bin +3 -0
  21. pytorch_model-00018-of-00067.bin +3 -0
  22. pytorch_model-00019-of-00067.bin +3 -0
  23. pytorch_model-00020-of-00067.bin +3 -0
  24. pytorch_model-00021-of-00067.bin +3 -0
  25. pytorch_model-00022-of-00067.bin +3 -0
  26. pytorch_model-00023-of-00067.bin +3 -0
  27. pytorch_model-00024-of-00067.bin +3 -0
  28. pytorch_model-00025-of-00067.bin +3 -0
  29. pytorch_model-00026-of-00067.bin +3 -0
  30. pytorch_model-00027-of-00067.bin +3 -0
  31. pytorch_model-00028-of-00067.bin +3 -0
  32. pytorch_model-00029-of-00067.bin +3 -0
  33. pytorch_model-00030-of-00067.bin +3 -0
  34. pytorch_model-00031-of-00067.bin +3 -0
  35. pytorch_model-00032-of-00067.bin +3 -0
  36. pytorch_model-00033-of-00067.bin +3 -0
  37. pytorch_model-00034-of-00067.bin +3 -0
  38. pytorch_model-00035-of-00067.bin +3 -0
  39. pytorch_model-00036-of-00067.bin +3 -0
  40. pytorch_model-00037-of-00067.bin +3 -0
  41. pytorch_model-00038-of-00067.bin +3 -0
  42. pytorch_model-00039-of-00067.bin +3 -0
  43. pytorch_model-00040-of-00067.bin +3 -0
  44. pytorch_model-00041-of-00067.bin +3 -0
  45. pytorch_model-00042-of-00067.bin +3 -0
  46. pytorch_model-00043-of-00067.bin +3 -0
  47. pytorch_model-00044-of-00067.bin +3 -0
  48. pytorch_model-00045-of-00067.bin +3 -0
  49. pytorch_model-00046-of-00067.bin +3 -0
  50. pytorch_model-00047-of-00067.bin +3 -0
config.json ADDED
@@ -0,0 +1,82 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "EleutherAI/gpt-neo-2.7B",
3
+ "activation_function": "gelu_new",
4
+ "architectures": [
5
+ "GPTNeoForCausalLM"
6
+ ],
7
+ "attention_dropout": 0,
8
+ "attention_layers": [
9
+ "global",
10
+ "local",
11
+ "global",
12
+ "local",
13
+ "global",
14
+ "local",
15
+ "global",
16
+ "local",
17
+ "global",
18
+ "local",
19
+ "global",
20
+ "local",
21
+ "global",
22
+ "local",
23
+ "global",
24
+ "local",
25
+ "global",
26
+ "local",
27
+ "global",
28
+ "local",
29
+ "global",
30
+ "local",
31
+ "global",
32
+ "local",
33
+ "global",
34
+ "local",
35
+ "global",
36
+ "local",
37
+ "global",
38
+ "local",
39
+ "global",
40
+ "local"
41
+ ],
42
+ "attention_types": [
43
+ [
44
+ [
45
+ "global",
46
+ "local"
47
+ ],
48
+ 16
49
+ ]
50
+ ],
51
+ "bos_token_id": 50256,
52
+ "embed_dropout": 0,
53
+ "eos_token_id": 50256,
54
+ "gradient_checkpointing": false,
55
+ "hidden_size": 2560,
56
+ "initializer_range": 0.02,
57
+ "intermediate_size": null,
58
+ "layer_norm_epsilon": 1e-05,
59
+ "max_position_embeddings": 2048,
60
+ "model_type": "gpt_neo",
61
+ "num_heads": 20,
62
+ "num_layers": 32,
63
+ "resid_dropout": 0,
64
+ "summary_activation": null,
65
+ "summary_first_dropout": 0.1,
66
+ "summary_proj_to_labels": true,
67
+ "summary_type": "cls_index",
68
+ "summary_use_proj": true,
69
+ "task_specific_params": {
70
+ "text-generation": {
71
+ "do_sample": true,
72
+ "max_length": 50,
73
+ "temperature": 0.9
74
+ }
75
+ },
76
+ "tokenizer_class": "GPT2Tokenizer",
77
+ "torch_dtype": "float32",
78
+ "transformers_version": "4.27.4",
79
+ "use_cache": true,
80
+ "vocab_size": 50257,
81
+ "window_size": 256
82
+ }
generation_config.json ADDED
@@ -0,0 +1,6 @@
 
 
 
 
 
 
 
1
+ {
2
+ "_from_model_config": true,
3
+ "bos_token_id": 50256,
4
+ "eos_token_id": 50256,
5
+ "transformers_version": "4.27.4"
6
+ }
merges.txt ADDED
The diff for this file is too large to render. See raw diff
 
pytorch_model-00001-of-00067.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c25394dae9525a82566ce0eadac7dd3e5a7cd7a43a6efc94c6a3ac6296fb34f9
3
+ size 537
pytorch_model-00002-of-00067.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1101cff3c0d7930e1b7c451779af3d3acb770e045758c140a5673b7614c629f9
3
+ size 514632618
pytorch_model-00003-of-00067.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:96812cc0e5d834c4310e708790f804f3d6cc6fdeff3c93068c49c0bf2e6da3b1
3
+ size 130078951
pytorch_model-00004-of-00067.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:13d0dffb7d74c33b03e197247b3dcd4e3186288756048cfc09faf4c86f81cdfc
3
+ size 104899771
pytorch_model-00005-of-00067.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c3419e1fdef9991097e0aa9e3f54d73c0897d85506e593fc318603c892814a24
3
+ size 187729266
pytorch_model-00006-of-00067.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a68456c8cbf6e5e7bc3b10e3f9d6e44f69efad2df993363af8815f83e40395e0
3
+ size 131146111
pytorch_model-00007-of-00067.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:58d1d4ac33092a9353d0e7ac3ad2b6b3d4fbbf131a989f9f1a7e10e00461820d
3
+ size 187729266
pytorch_model-00008-of-00067.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a6a04f6b77aae6196cbb0bab3eff86de37bffdd415ae19f6ac6ccc7154921b2c
3
+ size 131146111
pytorch_model-00009-of-00067.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f8f6064b6f03bc912644bfa4560572ebc633f03cdea8d77c073294d090f24191
3
+ size 187729266
pytorch_model-00010-of-00067.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e51dbe98b9d3c8509dedcc9c029be0a6ff84d325800065d06a1c48b641555db0
3
+ size 131146111
pytorch_model-00011-of-00067.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:32bec2e58f5984e59323d406f386760d21c3727c89a56c3678e4b69001deeaec
3
+ size 187729266
pytorch_model-00012-of-00067.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2ef5d57d300b584800556f0c0d3c5a48941c32a030bf9b61c523b9c6304f869f
3
+ size 131146111
pytorch_model-00013-of-00067.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a268d20150c89c30c09a828db0a586941dc1e459972548a0947125e309478efd
3
+ size 187729266
pytorch_model-00014-of-00067.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bc71371e016f85e25a08a3e0213fb85e0310bd642dae202d5e7f06113a185772
3
+ size 131146111
pytorch_model-00015-of-00067.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:edb10a883d19621826be15883063841e4dbe492c7ceba98e03aaa9028b389237
3
+ size 187729266
pytorch_model-00016-of-00067.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5571fed4f70fa9b215890e0c7b7e355d662eb10327f70df16ad5cfe2f5291f96
3
+ size 131146111
pytorch_model-00017-of-00067.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:41b881d967af1796e04dc8d0050493747d09c44c6e8c293712a23c88bf026af1
3
+ size 187729266
pytorch_model-00018-of-00067.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:44e8c1a83188b0b260fa8759252217733a37333845bc781f17ee83576459e750
3
+ size 131146111
pytorch_model-00019-of-00067.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:814577f613c7338521fd3f9dab79712573e965a22cddac662b5c41dab6c3bf3a
3
+ size 187729266
pytorch_model-00020-of-00067.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:016fd3eb61fa1f22d2eeea5a65b0707232dd7739977359fc624a2c20bee96ec9
3
+ size 131146111
pytorch_model-00021-of-00067.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:49e1cc7591c0530db0f2941874609afeb1f4035b0d5867366f5bec9101ecc79f
3
+ size 187729266
pytorch_model-00022-of-00067.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b2c7ca00a15206c8262c7e3e8cb313bd5a41370937c0a1328de6f58c519870c4
3
+ size 131146111
pytorch_model-00023-of-00067.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:19efc143e6c88fdceb18d4c3d1e21733817ab6e00e97cd847434ab9d9240d9e7
3
+ size 187729266
pytorch_model-00024-of-00067.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:00d0b0875ba05193d6b25f8efb92a8d710211b360f7a8779fbc067a7659e1c74
3
+ size 131146111
pytorch_model-00025-of-00067.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:df68dbf3cc50c0e7cf2ca1ee47f71fdc037393653b85a563707fbb953d0a25f4
3
+ size 187729266
pytorch_model-00026-of-00067.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e2749317d5763f3fccfc067dda4406bae408a069f2ba6a7f72e52574b9fefc98
3
+ size 131146111
pytorch_model-00027-of-00067.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4dfcd957bcba370c61a3c921ff354c03e2d5a09ecb9218d899daf7d3fbb8648e
3
+ size 187729266
pytorch_model-00028-of-00067.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9a7f0a66f2eda014ef6d59131c311ebea52f72c6abbc233443b20bca1f0cd7ac
3
+ size 131146111
pytorch_model-00029-of-00067.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:604b65ee4fa39e92b12dc4815e0ace8bc8920f1ebf24b14c8eda328675820560
3
+ size 187729266
pytorch_model-00030-of-00067.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7f5d448d35f47ddd8b3ee1d0079605ac9fe155e91204c08ce535d55895b39572
3
+ size 131146111
pytorch_model-00031-of-00067.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3704b8e266d9d10057714ad06621e23aee44981b72f45ad99ba77218e73bff83
3
+ size 187729266
pytorch_model-00032-of-00067.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:04aa5802576b5bbfc913f881d89726ed513772af2a60c761145043cbf3320711
3
+ size 131146111
pytorch_model-00033-of-00067.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:24101a58aaa999e17e6eea45ec5ef554172ff6913a0801c9a60837d07dfdaaf4
3
+ size 187729266
pytorch_model-00034-of-00067.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:03d727d1532e819036e8039c1a36c048a5dde36e07f4f9d95ff2f3d9fa28e921
3
+ size 131146111
pytorch_model-00035-of-00067.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4ca035894a96948c0e7e6a7ee4621405aadd905b3426ef5224689a731e271412
3
+ size 187729266
pytorch_model-00036-of-00067.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2961fe1deca7428501ffafa5d84aeb5e186d8dbd73dd07da79aa31e939378961
3
+ size 131146111
pytorch_model-00037-of-00067.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4f768a528d049fe2bd356c15ec64b8dd05c7aa7200d2483a78cb5633308e1b2f
3
+ size 187729266
pytorch_model-00038-of-00067.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ed62aa2e131327a6d29b039321cbdccc5d84f19f8e257d48db17080682bb7d2f
3
+ size 131146111
pytorch_model-00039-of-00067.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d24fb976190da73a8ac00f1469ca7d70e8b95c8ae3eb9e562eb574880101b59a
3
+ size 187729266
pytorch_model-00040-of-00067.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3b424ab76f4dcf10733e1a49456fbc5b07e9061652b4bd8e747edc9ab9cb5879
3
+ size 131146111
pytorch_model-00041-of-00067.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2590d97ebe6ef54d690d00506171b648931afd6bf3c56e1247b80ac2ecbc579a
3
+ size 187729266
pytorch_model-00042-of-00067.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b79d6cb942a194465a77e96ffcbf3201b7c1f274f39208182832f79adb845179
3
+ size 131146111
pytorch_model-00043-of-00067.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e508d93657040d4ddc59d1112f9af2223095793adc22362f72bc0edf6c773450
3
+ size 187729266
pytorch_model-00044-of-00067.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:55c2c5d165bf8a74de7339ffc61db9d9e532b774cf65c68273f61eaad3415dc8
3
+ size 131146111
pytorch_model-00045-of-00067.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c77a85b283aa63b8e38ffcc0848a3ea750e83a7234d27ce658d6038294f80091
3
+ size 187729266
pytorch_model-00046-of-00067.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:33d22339a6d1474ee17ef72e7ca0ff617e6169b4dbadcedf3724fa24146315fd
3
+ size 131146111
pytorch_model-00047-of-00067.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ba67aa11d62517e6f3e5e3037b2cd33abee7e4aeb3ac86c61b7d55bb19c40559
3
+ size 187729266