xpsychted committed on
Commit
1af1c2d
1 Parent(s): 1d9661f

Upload 63 files

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. flan-t5-xl-sharded/config.json +62 -0
  2. flan-t5-xl-sharded/generation_config.json +7 -0
  3. flan-t5-xl-sharded/pytorch_model-00001-of-00060.bin +3 -0
  4. flan-t5-xl-sharded/pytorch_model-00002-of-00060.bin +3 -0
  5. flan-t5-xl-sharded/pytorch_model-00003-of-00060.bin +3 -0
  6. flan-t5-xl-sharded/pytorch_model-00004-of-00060.bin +3 -0
  7. flan-t5-xl-sharded/pytorch_model-00005-of-00060.bin +3 -0
  8. flan-t5-xl-sharded/pytorch_model-00006-of-00060.bin +3 -0
  9. flan-t5-xl-sharded/pytorch_model-00007-of-00060.bin +3 -0
  10. flan-t5-xl-sharded/pytorch_model-00008-of-00060.bin +3 -0
  11. flan-t5-xl-sharded/pytorch_model-00009-of-00060.bin +3 -0
  12. flan-t5-xl-sharded/pytorch_model-00010-of-00060.bin +3 -0
  13. flan-t5-xl-sharded/pytorch_model-00011-of-00060.bin +3 -0
  14. flan-t5-xl-sharded/pytorch_model-00012-of-00060.bin +3 -0
  15. flan-t5-xl-sharded/pytorch_model-00013-of-00060.bin +3 -0
  16. flan-t5-xl-sharded/pytorch_model-00014-of-00060.bin +3 -0
  17. flan-t5-xl-sharded/pytorch_model-00015-of-00060.bin +3 -0
  18. flan-t5-xl-sharded/pytorch_model-00016-of-00060.bin +3 -0
  19. flan-t5-xl-sharded/pytorch_model-00017-of-00060.bin +3 -0
  20. flan-t5-xl-sharded/pytorch_model-00018-of-00060.bin +3 -0
  21. flan-t5-xl-sharded/pytorch_model-00019-of-00060.bin +3 -0
  22. flan-t5-xl-sharded/pytorch_model-00020-of-00060.bin +3 -0
  23. flan-t5-xl-sharded/pytorch_model-00021-of-00060.bin +3 -0
  24. flan-t5-xl-sharded/pytorch_model-00022-of-00060.bin +3 -0
  25. flan-t5-xl-sharded/pytorch_model-00023-of-00060.bin +3 -0
  26. flan-t5-xl-sharded/pytorch_model-00024-of-00060.bin +3 -0
  27. flan-t5-xl-sharded/pytorch_model-00025-of-00060.bin +3 -0
  28. flan-t5-xl-sharded/pytorch_model-00026-of-00060.bin +3 -0
  29. flan-t5-xl-sharded/pytorch_model-00027-of-00060.bin +3 -0
  30. flan-t5-xl-sharded/pytorch_model-00028-of-00060.bin +3 -0
  31. flan-t5-xl-sharded/pytorch_model-00029-of-00060.bin +3 -0
  32. flan-t5-xl-sharded/pytorch_model-00030-of-00060.bin +3 -0
  33. flan-t5-xl-sharded/pytorch_model-00031-of-00060.bin +3 -0
  34. flan-t5-xl-sharded/pytorch_model-00032-of-00060.bin +3 -0
  35. flan-t5-xl-sharded/pytorch_model-00033-of-00060.bin +3 -0
  36. flan-t5-xl-sharded/pytorch_model-00034-of-00060.bin +3 -0
  37. flan-t5-xl-sharded/pytorch_model-00035-of-00060.bin +3 -0
  38. flan-t5-xl-sharded/pytorch_model-00036-of-00060.bin +3 -0
  39. flan-t5-xl-sharded/pytorch_model-00037-of-00060.bin +3 -0
  40. flan-t5-xl-sharded/pytorch_model-00038-of-00060.bin +3 -0
  41. flan-t5-xl-sharded/pytorch_model-00039-of-00060.bin +3 -0
  42. flan-t5-xl-sharded/pytorch_model-00040-of-00060.bin +3 -0
  43. flan-t5-xl-sharded/pytorch_model-00041-of-00060.bin +3 -0
  44. flan-t5-xl-sharded/pytorch_model-00042-of-00060.bin +3 -0
  45. flan-t5-xl-sharded/pytorch_model-00043-of-00060.bin +3 -0
  46. flan-t5-xl-sharded/pytorch_model-00044-of-00060.bin +3 -0
  47. flan-t5-xl-sharded/pytorch_model-00045-of-00060.bin +3 -0
  48. flan-t5-xl-sharded/pytorch_model-00046-of-00060.bin +3 -0
  49. flan-t5-xl-sharded/pytorch_model-00047-of-00060.bin +3 -0
  50. flan-t5-xl-sharded/pytorch_model-00048-of-00060.bin +3 -0
flan-t5-xl-sharded/config.json ADDED
@@ -0,0 +1,62 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "google/flan-t5-xl",
3
+ "architectures": [
4
+ "T5ForConditionalGeneration"
5
+ ],
6
+ "classifier_dropout": 0.0,
7
+ "d_ff": 5120,
8
+ "d_kv": 64,
9
+ "d_model": 2048,
10
+ "decoder_start_token_id": 0,
11
+ "dense_act_fn": "gelu_new",
12
+ "dropout_rate": 0.1,
13
+ "eos_token_id": 1,
14
+ "feed_forward_proj": "gated-gelu",
15
+ "initializer_factor": 1.0,
16
+ "is_encoder_decoder": true,
17
+ "is_gated_act": true,
18
+ "layer_norm_epsilon": 1e-06,
19
+ "model_type": "t5",
20
+ "n_positions": 512,
21
+ "num_decoder_layers": 24,
22
+ "num_heads": 32,
23
+ "num_layers": 24,
24
+ "output_past": true,
25
+ "pad_token_id": 0,
26
+ "relative_attention_max_distance": 128,
27
+ "relative_attention_num_buckets": 32,
28
+ "task_specific_params": {
29
+ "summarization": {
30
+ "early_stopping": true,
31
+ "length_penalty": 2.0,
32
+ "max_length": 200,
33
+ "min_length": 30,
34
+ "no_repeat_ngram_size": 3,
35
+ "num_beams": 4,
36
+ "prefix": "summarize: "
37
+ },
38
+ "translation_en_to_de": {
39
+ "early_stopping": true,
40
+ "max_length": 300,
41
+ "num_beams": 4,
42
+ "prefix": "translate English to German: "
43
+ },
44
+ "translation_en_to_fr": {
45
+ "early_stopping": true,
46
+ "max_length": 300,
47
+ "num_beams": 4,
48
+ "prefix": "translate English to French: "
49
+ },
50
+ "translation_en_to_ro": {
51
+ "early_stopping": true,
52
+ "max_length": 300,
53
+ "num_beams": 4,
54
+ "prefix": "translate English to Romanian: "
55
+ }
56
+ },
57
+ "tie_word_embeddings": false,
58
+ "torch_dtype": "float32",
59
+ "transformers_version": "4.33.0",
60
+ "use_cache": true,
61
+ "vocab_size": 32128
62
+ }
flan-t5-xl-sharded/generation_config.json ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ {
2
+ "_from_model_config": true,
3
+ "decoder_start_token_id": 0,
4
+ "eos_token_id": 1,
5
+ "pad_token_id": 0,
6
+ "transformers_version": "4.33.0"
7
+ }
flan-t5-xl-sharded/pytorch_model-00001-of-00060.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4b6e6074eea25c2fff075960e9fc440cbd60944f475ee8a73b6e6414772aa377
3
+ size 263193642
flan-t5-xl-sharded/pytorch_model-00002-of-00060.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bf24db533e9a0678ef4e4602fe9f5add333fc50ccaaf56acba5a85d1dc49e7f7
3
+ size 192962307
flan-t5-xl-sharded/pytorch_model-00003-of-00060.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4bceccc159e3f828ce9407e9d9bde8e671db3d134433583570cd9e7551363930
3
+ size 192957874
flan-t5-xl-sharded/pytorch_model-00004-of-00060.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:31ca83212541bd37284ec5d7540cdabab3e0f7369629420392e6bb136da70b47
3
+ size 192957874
flan-t5-xl-sharded/pytorch_model-00005-of-00060.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f3c3223f89cf30ef76d631b038694f08b80bfcbe632314eff24fc3f8c865c20b
3
+ size 192957874
flan-t5-xl-sharded/pytorch_model-00006-of-00060.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d363580ca0532984b0ebc233bd6803b6614c5365d39f422c7bfdb06df40826be
3
+ size 192957874
flan-t5-xl-sharded/pytorch_model-00007-of-00060.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:df20ed9d541a139b1a229ba96f73eda8af1c58941b0411ec80d6f22314783748
3
+ size 192957874
flan-t5-xl-sharded/pytorch_model-00008-of-00060.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c4ec9f5d1d17c33f797966bdca40ab2f4d513cb81894d4142c66cd4d4055f63d
3
+ size 192957874
flan-t5-xl-sharded/pytorch_model-00009-of-00060.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3147a0c4152c2c9b459934a5d668b96741236e6b63a29c2a5c4cde7a8ebc4b89
3
+ size 192957874
flan-t5-xl-sharded/pytorch_model-00010-of-00060.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:21d9a8592ecd81c10852d236f06947a78c528af9bb88d208b59f5dbdb390d161
3
+ size 192957874
flan-t5-xl-sharded/pytorch_model-00011-of-00060.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f1734774f79fd2ec12296ace14ebeca4387f2a397a3f27d49de2ec67ad7857c2
3
+ size 192957874
flan-t5-xl-sharded/pytorch_model-00012-of-00060.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e09703a351323bfb169db977868145a3ac547e8e5750d130456177b63f518d03
3
+ size 192957874
flan-t5-xl-sharded/pytorch_model-00013-of-00060.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:52af75bb204d93273f960e1da7c5980b39faa7b2c9eb1a97bca9cfb4759d6219
3
+ size 192957874
flan-t5-xl-sharded/pytorch_model-00014-of-00060.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:118638b13dc1aca60eaf5cf2bdf0b1e0f3823b020ccc6d6e0e0d298d49e22286
3
+ size 192957874
flan-t5-xl-sharded/pytorch_model-00015-of-00060.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cc265cb8d4894276975d97803b952d7520ce60f8c9ad8adc976cab92483883f2
3
+ size 192957874
flan-t5-xl-sharded/pytorch_model-00016-of-00060.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b4abd10799adf9b41c182ca58dd88c9b108c3ee4337825b85a1673a507ef63b8
3
+ size 192957874
flan-t5-xl-sharded/pytorch_model-00017-of-00060.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a91c7785999307a90721fd58a774dc0d9df44004d82d90a6fa399f3ec1e2caa5
3
+ size 192957874
flan-t5-xl-sharded/pytorch_model-00018-of-00060.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:691e88cea99e09b8ce14991bb5b053128d8530ed29590a3cc5f908db953700e4
3
+ size 192957874
flan-t5-xl-sharded/pytorch_model-00019-of-00060.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f9c887ae2292a02ff5cc67ef2c489af28d61dfdd52d8f878f582f2b51791a33c
3
+ size 192957874
flan-t5-xl-sharded/pytorch_model-00020-of-00060.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f37d2fe108c8607423b0fd6c87ab0ec222bfd65eccd9e731f540f40ec064770e
3
+ size 192957874
flan-t5-xl-sharded/pytorch_model-00021-of-00060.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2a1d62a77f68a377906f05f393d0745eff299b33e83081d5c3f6f3fab5e5388b
3
+ size 192957874
flan-t5-xl-sharded/pytorch_model-00022-of-00060.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1ae5328af3b113b0d83f9fa440efa444797764ae3a7fdcd4ab8f95e9e03c4e09
3
+ size 192957874
flan-t5-xl-sharded/pytorch_model-00023-of-00060.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:930778bd6a7801acfa78251d7bc8e8c545c2311543178f93a952de98f461795e
3
+ size 192957874
flan-t5-xl-sharded/pytorch_model-00024-of-00060.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:354572422f7050b018ea2715d812dbbfa31e9d3bc9d3978f857670ed3501c86b
3
+ size 192957874
flan-t5-xl-sharded/pytorch_model-00025-of-00060.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5e75ef057d8eb6a7c3c535db36f489a19bce7a47deefafed0b26795882b77020
3
+ size 192966403
flan-t5-xl-sharded/pytorch_model-00026-of-00060.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:77b786049cb6ee209849da9af47b26919b79371f43ee9496cee89523d1dace13
3
+ size 176185767
flan-t5-xl-sharded/pytorch_model-00027-of-00060.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2823d92db9d934c85aa49cdb2b227fb9816fdd4329b5cfb0160071b5b402b890
3
+ size 184569603
flan-t5-xl-sharded/pytorch_model-00028-of-00060.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:81f381ac907ea41fd40a2b1e18c397c239d834f953987b8a0989a01c5e33fd88
3
+ size 192957874
flan-t5-xl-sharded/pytorch_model-00029-of-00060.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5525ddcda6c2231f9e3dde783d813e592343eade112ad782dda7469c91dbc070
3
+ size 184569603
flan-t5-xl-sharded/pytorch_model-00030-of-00060.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0c5cc30772c34366157e3b781e81406719ab06cdf7d18d5dde4789f9a17d9c3b
3
+ size 176189799
flan-t5-xl-sharded/pytorch_model-00031-of-00060.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:648601c536093c795b4df9ff7f449a7c258471858ad3ecfe5238a526d0805fde
3
+ size 192957874
flan-t5-xl-sharded/pytorch_model-00032-of-00060.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:000b61ac3433bec98025a09e82c979669d4a62a0968930a53ed4e09316d9665a
3
+ size 192957874
flan-t5-xl-sharded/pytorch_model-00033-of-00060.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1b0649385d3d887b66805d8bc27e5c4cc234c1ff09eeedabc7b4d2f1f157a940
3
+ size 176181333
flan-t5-xl-sharded/pytorch_model-00034-of-00060.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:31d4950586b474638996d20caa8ccaecfb4897ca075708b28907076e8a8e1b14
3
+ size 184569603
flan-t5-xl-sharded/pytorch_model-00035-of-00060.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8608e2ff1a9114545cca624238e96b68f0dec3e1e597e8fd415f2a630cffef9b
3
+ size 192957874
flan-t5-xl-sharded/pytorch_model-00036-of-00060.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9d71b1b3368f33e8b9523ce4a2af076686b4a1d8638810213e4e7e87191eaf26
3
+ size 184569603
flan-t5-xl-sharded/pytorch_model-00037-of-00060.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:178140a6a34e3a51cbb4a75269972c25048e9a398bb7cb46880a0bf913f52eee
3
+ size 176189799
flan-t5-xl-sharded/pytorch_model-00038-of-00060.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:238ebbba5fb3c3f451ebbae08f853d709d1ab46e131006bf4627be883a9aa218
3
+ size 192957874
flan-t5-xl-sharded/pytorch_model-00039-of-00060.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:219a788632d3351a2859bc8fbd1dc9274d3b31a9cdedee981f32ecc0f57a327d
3
+ size 192957874
flan-t5-xl-sharded/pytorch_model-00040-of-00060.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:48dcf52943a5eeaa952a0248d87a52fdb5e40a9fdc9d4829af05e23db02546d1
3
+ size 176181333
flan-t5-xl-sharded/pytorch_model-00041-of-00060.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ce8e14264025cea38ad9116b699ad8b9da94172e0a1ba949e1bc42d0fa2bab33
3
+ size 184569603
flan-t5-xl-sharded/pytorch_model-00042-of-00060.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2486a013ac906485abf898c1bb60b1f49e5c5aa3ebb8e3d595cffb4d10863eba
3
+ size 192957874
flan-t5-xl-sharded/pytorch_model-00043-of-00060.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a80f2c41a0367714a6421bbce026f907e83472ee748d2440c3e30f77ae9d3e11
3
+ size 184569603
flan-t5-xl-sharded/pytorch_model-00044-of-00060.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1d018671aff30d92383920ecbee15f1e889b5086bd03a1a05c48a2915e92c902
3
+ size 176189799
flan-t5-xl-sharded/pytorch_model-00045-of-00060.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c3ea607280ed5fe1518764592239522be60a1751302b9e7530a53d5809899e57
3
+ size 192957874
flan-t5-xl-sharded/pytorch_model-00046-of-00060.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b240b3d1a526fe7f47b570aff1b87038e2ec81830462403c1feb7f2d85157704
3
+ size 192957874
flan-t5-xl-sharded/pytorch_model-00047-of-00060.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0dbfe60ef4113541d0450628acb73b4a51bf47edf54c2c079bd324314b98c1ce
3
+ size 176181333
flan-t5-xl-sharded/pytorch_model-00048-of-00060.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:175e69c16deff4f9d691367c22af4685c7c4605154b3ec637dffee13ac2a3a5d
3
+ size 184569603