End of training

Browse files

Files changed (15) hide show

added_tokens.json +1 -3
config.json +17 -16
generation_config.json +2 -1
merges.txt +0 -0
pytorch_model.bin +2 -2
runs/May19_11-51-14_DESKTOP-2LG01LF/1684461077.901282/events.out.tfevents.1684461077.DESKTOP-2LG01LF.12500.1 +3 -0
runs/May19_11-51-14_DESKTOP-2LG01LF/events.out.tfevents.1684461077.DESKTOP-2LG01LF.12500.0 +3 -0
runs/May19_11-54-25_DESKTOP-2LG01LF/1684461269.4669511/events.out.tfevents.1684461269.DESKTOP-2LG01LF.12500.3 +3 -0
runs/May19_11-54-25_DESKTOP-2LG01LF/events.out.tfevents.1684461269.DESKTOP-2LG01LF.12500.2 +3 -0
runs/May19_11-57-09_DESKTOP-2LG01LF/1684461433.3930838/events.out.tfevents.1684461433.DESKTOP-2LG01LF.12500.5 +3 -0
runs/May19_11-57-09_DESKTOP-2LG01LF/events.out.tfevents.1684461433.DESKTOP-2LG01LF.12500.4 +3 -0
special_tokens_map.json +22 -4
tokenizer_config.json +6 -6
training_args.bin +1 -1
vocab.json +2 -2

added_tokens.json CHANGED Viewed

@@ -1,5 +1,3 @@
 {
-  "</s>": 54944,
-  "<mask>": 54946,
-  "<s>": 54945
 }

 {
+  "<mask>": 8008
 }

config.json CHANGED Viewed

@@ -1,9 +1,9 @@
 {
-  "_name_or_path": "facebook/blenderbot_small-90m",
   "activation_dropout": 0.0,
   "activation_function": "gelu",
   "add_bias_logits": false,
-  "add_final_layer_norm": false,
   "architectures": [
     "BlenderbotForConditionalGeneration"
   ],
@@ -11,20 +11,21 @@
   "bos_token_id": 1,
   "classif_dropout": 0.0,
   "classifier_dropout": 0.0,
-  "d_model": 512,
-  "decoder_attention_heads": 16,
-  "decoder_ffn_dim": 2048,
   "decoder_layerdrop": 0.0,
-  "decoder_layers": 8,
   "decoder_start_token_id": 1,
   "do_blenderbot_90_layernorm": true,
   "dropout": 0.1,
-  "encoder_attention_heads": 16,
-  "encoder_ffn_dim": 2048,
   "encoder_layerdrop": 0.0,
-  "encoder_layers": 8,
   "encoder_no_repeat_ngram_size": 3,
   "eos_token_id": 2,
   "extra_pos_embeddings": 0,
   "force_bos_token_to_be_generated": false,
   "forced_eos_token_id": 2,
@@ -41,17 +42,17 @@
     "LABEL_1": 1,
     "LABEL_2": 2
   },
-  "layernorm_variant": "xlm",
   "length_penalty": 0.65,
-  "max_length": 128,
-  "max_position_embeddings": 512,
   "min_length": 20,
   "model_type": "blenderbot",
   "no_repeat_ngram_size": 3,
-  "normalize_before": false,
-  "normalize_embedding": true,
   "num_beams": 10,
-  "num_hidden_layers": 8,
   "pad_token_id": 0,
   "scale_embedding": true,
   "static_position_embeddings": false,
@@ -59,5 +60,5 @@
   "transformers_version": "4.29.1",
   "unk_token_id": 3,
   "use_cache": true,
-  "vocab_size": 54944
 }

 {
+  "_name_or_path": "facebook/blenderbot-400M-distill",
   "activation_dropout": 0.0,
   "activation_function": "gelu",
   "add_bias_logits": false,
+  "add_final_layer_norm": true,
   "architectures": [
     "BlenderbotForConditionalGeneration"
   ],
   "bos_token_id": 1,
   "classif_dropout": 0.0,
   "classifier_dropout": 0.0,
+  "d_model": 1280,
+  "decoder_attention_heads": 32,
+  "decoder_ffn_dim": 5120,
   "decoder_layerdrop": 0.0,
+  "decoder_layers": 12,
   "decoder_start_token_id": 1,
   "do_blenderbot_90_layernorm": true,
   "dropout": 0.1,
+  "encoder_attention_heads": 32,
+  "encoder_ffn_dim": 5120,
   "encoder_layerdrop": 0.0,
+  "encoder_layers": 2,
   "encoder_no_repeat_ngram_size": 3,
   "eos_token_id": 2,
+  "extra_layer_norm": false,
   "extra_pos_embeddings": 0,
   "force_bos_token_to_be_generated": false,
   "forced_eos_token_id": 2,
     "LABEL_1": 1,
     "LABEL_2": 2
   },
+  "layernorm_variant": "prelayernorm",
   "length_penalty": 0.65,
+  "max_length": 60,
+  "max_position_embeddings": 128,
   "min_length": 20,
   "model_type": "blenderbot",
   "no_repeat_ngram_size": 3,
+  "normalize_before": true,
+  "normalize_embedding": false,
   "num_beams": 10,
+  "num_hidden_layers": 2,
   "pad_token_id": 0,
   "scale_embedding": true,
   "static_position_embeddings": false,
   "transformers_version": "4.29.1",
   "unk_token_id": 3,
   "use_cache": true,
+  "vocab_size": 8008
 }

generation_config.json CHANGED Viewed

@@ -2,10 +2,11 @@
   "_from_model_config": true,
   "bos_token_id": 1,
   "decoder_start_token_id": 1,
   "eos_token_id": 2,
   "forced_eos_token_id": 2,
   "length_penalty": 0.65,
-  "max_length": 128,
   "min_length": 20,
   "no_repeat_ngram_size": 3,
   "num_beams": 10,

   "_from_model_config": true,
   "bos_token_id": 1,
   "decoder_start_token_id": 1,
+  "encoder_no_repeat_ngram_size": 3,
   "eos_token_id": 2,
   "forced_eos_token_id": 2,
   "length_penalty": 0.65,
+  "max_length": 60,
   "min_length": 20,
   "no_repeat_ngram_size": 3,
   "num_beams": 10,

merges.txt CHANGED Viewed

The diff for this file is too large to render. See raw diff

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:08cf310e873f501575b0742cd7ed436342df2fd17047749dc9a689a09665279b
-size 350368045

 version https://git-lfs.github.com/spec/v1
+oid sha256:b9680b47d359a3349cf9d3a4d0262dc3fc96988a017c0d7dab1a8776a65da219
+size 1459357453

runs/May19_11-51-14_DESKTOP-2LG01LF/1684461077.901282/events.out.tfevents.1684461077.DESKTOP-2LG01LF.12500.1 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:8db77e2c546916ad27b750d5b81bbb4abbcb7d2d2e7de733ff3b689051376fe9
+size 5886

runs/May19_11-51-14_DESKTOP-2LG01LF/events.out.tfevents.1684461077.DESKTOP-2LG01LF.12500.0 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:06cb98adcac4fe0c65d66d33bf13b404e27ea74330380a942284da111296be7b
+size 4943

runs/May19_11-54-25_DESKTOP-2LG01LF/1684461269.4669511/events.out.tfevents.1684461269.DESKTOP-2LG01LF.12500.3 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:795b3064a0db10cedf5ea6e85db9de17e9b561fccfd904b0421a3fab282d47b7
+size 5886

runs/May19_11-54-25_DESKTOP-2LG01LF/events.out.tfevents.1684461269.DESKTOP-2LG01LF.12500.2 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:2107dcb17e7ca2790bbb47ae3165f68d8f27adb330495ace2a2292f5595f73a9
+size 4943

runs/May19_11-57-09_DESKTOP-2LG01LF/1684461433.3930838/events.out.tfevents.1684461433.DESKTOP-2LG01LF.12500.5 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:5ed238b18161c792706a346668180c9e933f782902c3e739e4bfea2109c59ecc
+size 5886

runs/May19_11-57-09_DESKTOP-2LG01LF/events.out.tfevents.1684461433.DESKTOP-2LG01LF.12500.4 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:c7a565872a2360580bd6aafb1ca2021ca5822d7d55af9f45a89c5b035efbebfd
+size 5297

special_tokens_map.json CHANGED Viewed

@@ -1,5 +1,11 @@
 {
-  "bos_token": "__start__",
   "cls_token": {
     "content": "<s>",
     "lstrip": false,
@@ -7,7 +13,13 @@
     "rstrip": false,
     "single_word": false
   },
-  "eos_token": "__end__",
   "mask_token": {
     "content": "<mask>",
     "lstrip": true,
@@ -15,7 +27,7 @@
     "rstrip": false,
     "single_word": false
   },
-  "pad_token": "__end__",
   "sep_token": {
     "content": "</s>",
     "lstrip": false,
@@ -23,5 +35,11 @@
     "rstrip": false,
     "single_word": false
   },
-  "unk_token": "__unk__"
 }

 {
+  "bos_token": {
+    "content": "<s>",
+    "lstrip": false,
+    "normalized": true,
+    "rstrip": false,
+    "single_word": false
+  },
   "cls_token": {
     "content": "<s>",
     "lstrip": false,
     "rstrip": false,
     "single_word": false
   },
+  "eos_token": {
+    "content": "</s>",
+    "lstrip": false,
+    "normalized": true,
+    "rstrip": false,
+    "single_word": false
+  },
   "mask_token": {
     "content": "<mask>",
     "lstrip": true,
     "rstrip": false,
     "single_word": false
   },
+  "pad_token": "</s>",
   "sep_token": {
     "content": "</s>",
     "lstrip": false,
     "rstrip": false,
     "single_word": false
   },
+  "unk_token": {
+    "content": "<unk>",
+    "lstrip": false,
+    "normalized": true,
+    "rstrip": false,
+    "single_word": false
+  }
 }

tokenizer_config.json CHANGED Viewed

@@ -1,8 +1,8 @@
 {
-  "add_prefix_space": false,
   "bos_token": {
     "__type": "AddedToken",
-    "content": "__start__",
     "lstrip": false,
     "normalized": true,
     "rstrip": false,
@@ -19,7 +19,7 @@
   },
   "eos_token": {
     "__type": "AddedToken",
-    "content": "__end__",
     "lstrip": false,
     "normalized": true,
     "rstrip": false,
@@ -34,10 +34,10 @@
     "rstrip": false,
     "single_word": false
   },
-  "model_max_length": 1000000000000000019884624838656,
   "pad_token": {
     "__type": "AddedToken",
-    "content": "__null__",
     "lstrip": false,
     "normalized": true,
     "rstrip": false,
@@ -55,7 +55,7 @@
   "tokenizer_file": null,
   "unk_token": {
     "__type": "AddedToken",
-    "content": "__unk__",
     "lstrip": false,
     "normalized": true,
     "rstrip": false,

 {
+  "add_prefix_space": true,
   "bos_token": {
     "__type": "AddedToken",
+    "content": "<s>",
     "lstrip": false,
     "normalized": true,
     "rstrip": false,
   },
   "eos_token": {
     "__type": "AddedToken",
+    "content": "</s>",
     "lstrip": false,
     "normalized": true,
     "rstrip": false,
     "rstrip": false,
     "single_word": false
   },
+  "model_max_length": 128,
   "pad_token": {
     "__type": "AddedToken",
+    "content": "<pad>",
     "lstrip": false,
     "normalized": true,
     "rstrip": false,
   "tokenizer_file": null,
   "unk_token": {
     "__type": "AddedToken",
+    "content": "<unk>",
     "lstrip": false,
     "normalized": true,
     "rstrip": false,

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:483b092b54aedf4108f3ec7b4514dc8cfb39d413cdcda330edab1d33381e427e
 size 3899

 version https://git-lfs.github.com/spec/v1
+oid sha256:177de5e413c9a9a8ff0a26ad97f28132925b508b85c111b7693ca0bdc1176647
 size 3899

vocab.json CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:b8832092c8d923f8e995a0363a4d1caa5741d080d88367244098f9c553439da5
-size 1046602

 version https://git-lfs.github.com/spec/v1
+oid sha256:64c648ba108a954432cac35063663611942b734416caf91147dda23064a753de
+size 150920