pere committed on
Commit
1247d97
1 Parent(s): e91f263

fixing bug

Browse files

Files changed (5) hide show
  1. README.md +3 -1
  2. added_tokens.json +1 -1
  3. config.json +2 -2
  4. pytorch_model.bin +3 -0
  5. tokenizer_config.json +1 -1
README.md CHANGED
@@ -11,7 +11,9 @@ datasets:
11
 
12
  This is a Norwegian T5-base model trained on the Norwegian Colossal Corpus (NCC) on a TPU v3-8. It needs to be finetuned on a specific task before being used for anything.
13
 
14
- The following settings were used in training:
 
 
15
  ```bash
16
  ./run_t5_mlm_flax_streaming.py \
17
  --output_dir="./" \
11
 
12
  This is a Norwegian T5-base model trained on the Norwegian Colossal Corpus (NCC) on a TPU v3-8. It needs to be finetuned on a specific task before being used for anything.
13
 
14
+ The model is currently still training. Training is expected to finish by the end of August 2021.
15
+
16
+ The following settings were used in training:
17
  ```bash
18
  ./run_t5_mlm_flax_streaming.py \
19
  --output_dir="./" \
added_tokens.json CHANGED
@@ -1 +1 @@
1
- {"<extra_id_95>": 50098, "<extra_id_25>": 50028, "<extra_id_8>": 50011, "<extra_id_97>": 50100, "<extra_id_83>": 50086, "<extra_id_46>": 50049, "<extra_id_86>": 50089, "<extra_id_3>": 50006, "<extra_id_73>": 50076, "<extra_id_16>": 50019, "<extra_id_67>": 50070, "<extra_id_56>": 50059, "<extra_id_7>": 50010, "<extra_id_13>": 50016, "<extra_id_94>": 50097, "<extra_id_87>": 50090, "<extra_id_21>": 50024, "<extra_id_32>": 50035, "<extra_id_43>": 50046, "<extra_id_27>": 50030, "<extra_id_35>": 50038, "<extra_id_47>": 50050, "<extra_id_5>": 50008, "<extra_id_31>": 50034, "<extra_id_23>": 50026, "<extra_id_26>": 50029, "<extra_id_40>": 50043, "<extra_id_10>": 50013, "<extra_id_0>": 50003, "<extra_id_71>": 50074, "<extra_id_80>": 50083, "<extra_id_76>": 50079, "<extra_id_62>": 50065, "<extra_id_93>": 50096, "<extra_id_64>": 50067, "<extra_id_24>": 50027, "<extra_id_96>": 50099, "<extra_id_9>": 50012, "<extra_id_38>": 50041, "<extra_id_84>": 50087, "<extra_id_50>": 50053, "<extra_id_17>": 50020, "<extra_id_34>": 50037, "<extra_id_30>": 50033, "<extra_id_58>": 50061, "<extra_id_72>": 50075, "<extra_id_39>": 50042, "<extra_id_68>": 50071, "<extra_id_36>": 50039, "<extra_id_44>": 50047, "<extra_id_20>": 50023, "<extra_id_49>": 50052, "<extra_id_61>": 50064, "<extra_id_54>": 50057, "<extra_id_12>": 50015, "<extra_id_6>": 50009, "<extra_id_59>": 50062, "<extra_id_89>": 50092, "<extra_id_51>": 50054, "<extra_id_74>": 50077, "<extra_id_28>": 50031, "<extra_id_22>": 50025, "<extra_id_37>": 50040, "<extra_id_65>": 50068, "<extra_id_29>": 50032, "<extra_id_82>": 50085, "<extra_id_75>": 50078, "<extra_id_88>": 50091, "<extra_id_2>": 50005, "<extra_id_14>": 50017, "<extra_id_57>": 50060, "<extra_id_41>": 50044, "<extra_id_63>": 50066, "<extra_id_48>": 50051, "<extra_id_1>": 50004, "<extra_id_99>": 50102, "<extra_id_98>": 50101, "<extra_id_33>": 50036, "<extra_id_52>": 50055, "<extra_id_15>": 50018, "<extra_id_45>": 50048, "<extra_id_55>": 50058, "<extra_id_92>": 50095, 
"<extra_id_90>": 50093, "<extra_id_85>": 50088, "<extra_id_60>": 50063, "<extra_id_77>": 50080, "<extra_id_66>": 50069, "<extra_id_18>": 50021, "<extra_id_91>": 50094, "<extra_id_11>": 50014, "<extra_id_78>": 50081, "<extra_id_81>": 50084, "<extra_id_70>": 50073, "<extra_id_4>": 50007, "<extra_id_79>": 50082, "<extra_id_53>": 50056, "<extra_id_42>": 50045, "<extra_id_69>": 50072, "<extra_id_19>": 50022}
1
+ {"<extra_id_98>": 50101, "<extra_id_26>": 50029, "<extra_id_8>": 50011, "<extra_id_56>": 50059, "<extra_id_29>": 50032, "<extra_id_75>": 50078, "<extra_id_36>": 50039, "<extra_id_86>": 50089, "<extra_id_16>": 50019, "<extra_id_42>": 50045, "<extra_id_6>": 50009, "<extra_id_14>": 50017, "<extra_id_2>": 50005, "<extra_id_53>": 50056, "<extra_id_7>": 50010, "<extra_id_88>": 50091, "<extra_id_32>": 50035, "<extra_id_18>": 50021, "<extra_id_37>": 50040, "<extra_id_24>": 50027, "<extra_id_68>": 50071, "<extra_id_92>": 50095, "<extra_id_33>": 50036, "<extra_id_60>": 50063, "<extra_id_99>": 50102, "<extra_id_59>": 50062, "<extra_id_77>": 50080, "<extra_id_15>": 50018, "<extra_id_10>": 50013, "<extra_id_45>": 50048, "<extra_id_31>": 50034, "<extra_id_0>": 50003, "<extra_id_58>": 50061, "<extra_id_48>": 50051, "<extra_id_74>": 50077, "<extra_id_47>": 50050, "<extra_id_82>": 50085, "<extra_id_61>": 50064, "<extra_id_46>": 50049, "<extra_id_96>": 50099, "<extra_id_78>": 50081, "<extra_id_50>": 50053, "<extra_id_90>": 50093, "<extra_id_11>": 50014, "<extra_id_22>": 50025, "<extra_id_65>": 50068, "<extra_id_63>": 50066, "<extra_id_89>": 50092, "<extra_id_17>": 50020, "<extra_id_28>": 50031, "<extra_id_43>": 50046, "<extra_id_13>": 50016, "<extra_id_84>": 50087, "<extra_id_21>": 50024, "<extra_id_64>": 50067, "<extra_id_76>": 50079, "<extra_id_23>": 50026, "<extra_id_79>": 50082, "<extra_id_67>": 50070, "<extra_id_3>": 50006, "<extra_id_62>": 50065, "<extra_id_19>": 50022, "<extra_id_27>": 50030, "<extra_id_55>": 50058, "<extra_id_73>": 50076, "<extra_id_87>": 50090, "<extra_id_54>": 50057, "<extra_id_83>": 50086, "<extra_id_91>": 50094, "<extra_id_35>": 50038, "<extra_id_30>": 50033, "<extra_id_49>": 50052, "<extra_id_72>": 50075, "<extra_id_94>": 50097, "<extra_id_69>": 50072, "<extra_id_25>": 50028, "<extra_id_71>": 50074, "<extra_id_80>": 50083, "<extra_id_93>": 50096, "<extra_id_57>": 50060, "<extra_id_95>": 50098, "<extra_id_97>": 50100, "<extra_id_41>": 50044, 
"<extra_id_20>": 50023, "<extra_id_5>": 50008, "<extra_id_34>": 50037, "<extra_id_81>": 50084, "<extra_id_85>": 50088, "<extra_id_51>": 50054, "<extra_id_52>": 50055, "<extra_id_4>": 50007, "<extra_id_9>": 50012, "<extra_id_1>": 50004, "<extra_id_44>": 50047, "<extra_id_66>": 50069, "<extra_id_40>": 50043, "<extra_id_70>": 50073, "<extra_id_12>": 50015, "<extra_id_38>": 50041, "<extra_id_39>": 50042}
config.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
  "_name_or_path": ".",
3
  "architectures": [
4
- "T5ForConditionalGeneration"
5
  ],
6
  "d_ff": 2048,
7
  "d_kv": 64,
@@ -23,7 +23,7 @@
23
  "relative_attention_num_buckets": 32,
24
  "tie_word_embeddings": false,
25
  "torch_dtype": "float32",
26
- "transformers_version": "4.10.0.dev0",
27
  "use_cache": true,
28
  "vocab_size": 50103
29
  }
1
  {
2
  "_name_or_path": ".",
3
  "architectures": [
4
+ "T5Model"
5
  ],
6
  "d_ff": 2048,
7
  "d_kv": 64,
23
  "relative_attention_num_buckets": 32,
24
  "tie_word_embeddings": false,
25
  "torch_dtype": "float32",
26
+ "transformers_version": "4.9.0.dev0",
27
  "use_cache": true,
28
  "vocab_size": 50103
29
  }
pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b9cc8d879349e33182319a583fff28a3cd250f013b2de26d2e93d125b131901b
3
+ size 946956047
tokenizer_config.json CHANGED
@@ -1 +1 @@
1
- {"eos_token": "</s>", "unk_token": "<unk>", "pad_token": "<pad>", "extra_ids": 100, "additional_special_tokens": ["<extra_id_0>", "<extra_id_1>", "<extra_id_2>", "<extra_id_3>", "<extra_id_4>", "<extra_id_5>", "<extra_id_6>", "<extra_id_7>", "<extra_id_8>", "<extra_id_9>", "<extra_id_10>", "<extra_id_11>", "<extra_id_12>", "<extra_id_13>", "<extra_id_14>", "<extra_id_15>", "<extra_id_16>", "<extra_id_17>", "<extra_id_18>", "<extra_id_19>", "<extra_id_20>", "<extra_id_21>", "<extra_id_22>", "<extra_id_23>", "<extra_id_24>", "<extra_id_25>", "<extra_id_26>", "<extra_id_27>", "<extra_id_28>", "<extra_id_29>", "<extra_id_30>", "<extra_id_31>", "<extra_id_32>", "<extra_id_33>", "<extra_id_34>", "<extra_id_35>", "<extra_id_36>", "<extra_id_37>", "<extra_id_38>", "<extra_id_39>", "<extra_id_40>", "<extra_id_41>", "<extra_id_42>", "<extra_id_43>", "<extra_id_44>", "<extra_id_45>", "<extra_id_46>", "<extra_id_47>", "<extra_id_48>", "<extra_id_49>", "<extra_id_50>", "<extra_id_51>", "<extra_id_52>", "<extra_id_53>", "<extra_id_54>", "<extra_id_55>", "<extra_id_56>", "<extra_id_57>", "<extra_id_58>", "<extra_id_59>", "<extra_id_60>", "<extra_id_61>", "<extra_id_62>", "<extra_id_63>", "<extra_id_64>", "<extra_id_65>", "<extra_id_66>", "<extra_id_67>", "<extra_id_68>", "<extra_id_69>", "<extra_id_70>", "<extra_id_71>", "<extra_id_72>", "<extra_id_73>", "<extra_id_74>", "<extra_id_75>", "<extra_id_76>", "<extra_id_77>", "<extra_id_78>", "<extra_id_79>", "<extra_id_80>", "<extra_id_81>", "<extra_id_82>", "<extra_id_83>", "<extra_id_84>", "<extra_id_85>", "<extra_id_86>", "<extra_id_87>", "<extra_id_88>", "<extra_id_89>", "<extra_id_90>", "<extra_id_91>", "<extra_id_92>", "<extra_id_93>", "<extra_id_94>", "<extra_id_95>", "<extra_id_96>", "<extra_id_97>", "<extra_id_98>", "<extra_id_99>"], "use_fast": true, "special_tokens_map_file": null, "name_or_path": ".", "tokenizer_class": "T5Tokenizer"}
1
+ {"eos_token": "</s>", "unk_token": "<unk>", "pad_token": "<pad>", "extra_ids": 100, "additional_special_tokens": ["<extra_id_0>", "<extra_id_1>", "<extra_id_2>", "<extra_id_3>", "<extra_id_4>", "<extra_id_5>", "<extra_id_6>", "<extra_id_7>", "<extra_id_8>", "<extra_id_9>", "<extra_id_10>", "<extra_id_11>", "<extra_id_12>", "<extra_id_13>", "<extra_id_14>", "<extra_id_15>", "<extra_id_16>", "<extra_id_17>", "<extra_id_18>", "<extra_id_19>", "<extra_id_20>", "<extra_id_21>", "<extra_id_22>", "<extra_id_23>", "<extra_id_24>", "<extra_id_25>", "<extra_id_26>", "<extra_id_27>", "<extra_id_28>", "<extra_id_29>", "<extra_id_30>", "<extra_id_31>", "<extra_id_32>", "<extra_id_33>", "<extra_id_34>", "<extra_id_35>", "<extra_id_36>", "<extra_id_37>", "<extra_id_38>", "<extra_id_39>", "<extra_id_40>", "<extra_id_41>", "<extra_id_42>", "<extra_id_43>", "<extra_id_44>", "<extra_id_45>", "<extra_id_46>", "<extra_id_47>", "<extra_id_48>", "<extra_id_49>", "<extra_id_50>", "<extra_id_51>", "<extra_id_52>", "<extra_id_53>", "<extra_id_54>", "<extra_id_55>", "<extra_id_56>", "<extra_id_57>", "<extra_id_58>", "<extra_id_59>", "<extra_id_60>", "<extra_id_61>", "<extra_id_62>", "<extra_id_63>", "<extra_id_64>", "<extra_id_65>", "<extra_id_66>", "<extra_id_67>", "<extra_id_68>", "<extra_id_69>", "<extra_id_70>", "<extra_id_71>", "<extra_id_72>", "<extra_id_73>", "<extra_id_74>", "<extra_id_75>", "<extra_id_76>", "<extra_id_77>", "<extra_id_78>", "<extra_id_79>", "<extra_id_80>", "<extra_id_81>", "<extra_id_82>", "<extra_id_83>", "<extra_id_84>", "<extra_id_85>", "<extra_id_86>", "<extra_id_87>", "<extra_id_88>", "<extra_id_89>", "<extra_id_90>", "<extra_id_91>", "<extra_id_92>", "<extra_id_93>", "<extra_id_94>", "<extra_id_95>", "<extra_id_96>", "<extra_id_97>", "<extra_id_98>", "<extra_id_99>"], "use_fast": true, "special_tokens_map_file": null, "name_or_path": ".", "from_flax": true, "tokenizer_class": "T5Tokenizer"}