Training in progress, step 500

Browse files

Files changed (16) hide show

config.json +167 -0
model.safetensors +3 -0
runs/Jan22_10-19-55_gpu01-sensors-testing-0/events.out.tfevents.1705918832.gpu01-sensors-testing-0.228098.4 +3 -0
runs/Jan22_10-40-50_gpu01-sensors-testing-0/events.out.tfevents.1705920068.gpu01-sensors-testing-0.228098.5 +3 -0
runs/Jan22_10-42-56_gpu01-sensors-testing-0/events.out.tfevents.1705920180.gpu01-sensors-testing-0.228098.7 +3 -0
runs/Jan22_10-49-38_gpu01-sensors-testing-0/events.out.tfevents.1705920588.gpu01-sensors-testing-0.228098.8 +3 -0
runs/Jan22_10-53-09_gpu01-sensors-testing-0/events.out.tfevents.1705920792.gpu01-sensors-testing-0.228098.9 +3 -0
runs/Jan22_10-53-36_gpu01-sensors-testing-0/events.out.tfevents.1705920835.gpu01-sensors-testing-0.228098.10 +3 -0
runs/Jan22_10-55-27_gpu01-sensors-testing-0/events.out.tfevents.1705920930.gpu01-sensors-testing-0.228098.11 +3 -0
runs/Jan22_11-00-18_gpu01-sensors-testing-0/events.out.tfevents.1705921225.gpu01-sensors-testing-0.229126.0 +3 -0
runs/Jan22_11-04-09_gpu01-sensors-testing-0/events.out.tfevents.1705921450.gpu01-sensors-testing-0.229422.0 +3 -0
runs/Jan22_11-04-56_gpu01-sensors-testing-0/events.out.tfevents.1705921500.gpu01-sensors-testing-0.229422.1 +3 -0
special_tokens_map.json +4 -0
tokenizer.json +0 -0
tokenizer_config.json +12 -0
training_args.bin +3 -0

config.json ADDED Viewed

	@@ -0,0 +1,167 @@

+{
+  "architectures": [
+    "EncoderDecoderModel"
+  ],
+  "decoder": {
+    "_name_or_path": "",
+    "add_cross_attention": true,
+    "architectures": null,
+    "attention_probs_dropout_prob": 0.1,
+    "bad_words_ids": null,
+    "begin_suppress_tokens": null,
+    "bos_token_id": null,
+    "chunk_size_feed_forward": 0,
+    "classifier_dropout": null,
+    "cross_attention_hidden_size": null,
+    "decoder_start_token_id": 0,
+    "diversity_penalty": 0.0,
+    "do_sample": false,
+    "early_stopping": false,
+    "encoder_no_repeat_ngram_size": 0,
+    "eos_token_id": null,
+    "exponential_decay_length_penalty": null,
+    "finetuning_task": null,
+    "forced_bos_token_id": null,
+    "forced_eos_token_id": null,
+    "hidden_act": "gelu",
+    "hidden_dropout_prob": 0.1,
+    "hidden_size": 768,
+    "id2label": {
+      "0": "LABEL_0",
+      "1": "LABEL_1"
+    },
+    "initializer_range": 0.02,
+    "intermediate_size": 3072,
+    "is_decoder": true,
+    "is_encoder_decoder": false,
+    "label2id": {
+      "LABEL_0": 0,
+      "LABEL_1": 1
+    },
+    "layer_norm_eps": 1e-12,
+    "length_penalty": 1.0,
+    "max_length": 20,
+    "max_position_embeddings": 512,
+    "min_length": 0,
+    "model_type": "bert",
+    "no_repeat_ngram_size": 0,
+    "num_attention_heads": 12,
+    "num_beam_groups": 1,
+    "num_beams": 1,
+    "num_hidden_layers": 12,
+    "num_return_sequences": 1,
+    "output_attentions": false,
+    "output_hidden_states": false,
+    "output_scores": false,
+    "pad_token_id": 0,
+    "position_embedding_type": "absolute",
+    "prefix": null,
+    "problem_type": null,
+    "pruned_heads": {},
+    "remove_invalid_values": false,
+    "repetition_penalty": 1.0,
+    "return_dict": true,
+    "return_dict_in_generate": false,
+    "sep_token_id": null,
+    "suppress_tokens": null,
+    "task_specific_params": null,
+    "temperature": 1.0,
+    "tf_legacy_loss": false,
+    "tie_encoder_decoder": false,
+    "tie_word_embeddings": true,
+    "tokenizer_class": null,
+    "top_k": 50,
+    "top_p": 1.0,
+    "torch_dtype": null,
+    "torchscript": false,
+    "type_vocab_size": 2,
+    "typical_p": 1.0,
+    "use_bfloat16": false,
+    "use_cache": true,
+    "vocab_size": 52000
+  },
+  "decoder_start_token_id": 0,
+  "encoder": {
+    "_name_or_path": "",
+    "add_cross_attention": false,
+    "architectures": null,
+    "attention_probs_dropout_prob": 0.1,
+    "bad_words_ids": null,
+    "begin_suppress_tokens": null,
+    "bos_token_id": null,
+    "chunk_size_feed_forward": 0,
+    "classifier_dropout": null,
+    "cross_attention_hidden_size": null,
+    "decoder_start_token_id": 0,
+    "diversity_penalty": 0.0,
+    "do_sample": false,
+    "early_stopping": false,
+    "encoder_no_repeat_ngram_size": 0,
+    "eos_token_id": null,
+    "exponential_decay_length_penalty": null,
+    "finetuning_task": null,
+    "forced_bos_token_id": null,
+    "forced_eos_token_id": null,
+    "hidden_act": "gelu",
+    "hidden_dropout_prob": 0.1,
+    "hidden_size": 768,
+    "id2label": {
+      "0": "LABEL_0",
+      "1": "LABEL_1"
+    },
+    "initializer_range": 0.02,
+    "intermediate_size": 3072,
+    "is_decoder": false,
+    "is_encoder_decoder": false,
+    "label2id": {
+      "LABEL_0": 0,
+      "LABEL_1": 1
+    },
+    "layer_norm_eps": 1e-12,
+    "length_penalty": 1.0,
+    "max_length": 20,
+    "max_position_embeddings": 512,
+    "min_length": 0,
+    "model_type": "bert",
+    "no_repeat_ngram_size": 0,
+    "num_attention_heads": 12,
+    "num_beam_groups": 1,
+    "num_beams": 1,
+    "num_hidden_layers": 12,
+    "num_return_sequences": 1,
+    "output_attentions": false,
+    "output_hidden_states": false,
+    "output_scores": false,
+    "pad_token_id": 0,
+    "position_embedding_type": "absolute",
+    "prefix": null,
+    "problem_type": null,
+    "pruned_heads": {},
+    "remove_invalid_values": false,
+    "repetition_penalty": 1.0,
+    "return_dict": true,
+    "return_dict_in_generate": false,
+    "sep_token_id": null,
+    "suppress_tokens": null,
+    "task_specific_params": null,
+    "temperature": 1.0,
+    "tf_legacy_loss": false,
+    "tie_encoder_decoder": false,
+    "tie_word_embeddings": true,
+    "tokenizer_class": null,
+    "top_k": 50,
+    "top_p": 1.0,
+    "torch_dtype": null,
+    "torchscript": false,
+    "type_vocab_size": 2,
+    "typical_p": 1.0,
+    "use_bfloat16": false,
+    "use_cache": true,
+    "vocab_size": 52000
+  },
+  "is_encoder_decoder": true,
+  "model_type": "encoder-decoder",
+  "pad_token_id": 1,
+  "torch_dtype": "float32",
+  "transformers_version": "4.36.2"
+}

model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:3556c47156e448bbe00e4afff2324efd103bb324b01eb3af26fc7a5a90f03674
+size 1121565672

runs/Jan22_10-19-55_gpu01-sensors-testing-0/events.out.tfevents.1705918832.gpu01-sensors-testing-0.228098.4 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:21cef90a112ba702d81ed372e20d69844537963c93a3628ffd437804483083b1
+size 8270

runs/Jan22_10-40-50_gpu01-sensors-testing-0/events.out.tfevents.1705920068.gpu01-sensors-testing-0.228098.5 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:f3ecc7246b7903fa2f2d39dc7f53cef3a47984e9f53155de8d5029e2e9bdf211
+size 8270

runs/Jan22_10-42-56_gpu01-sensors-testing-0/events.out.tfevents.1705920180.gpu01-sensors-testing-0.228098.7 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:b8a5c52c7848e5a1368d5c9259c1b5737ae80181a35961d46c1cd3a4ea8c2f48
+size 8270

runs/Jan22_10-49-38_gpu01-sensors-testing-0/events.out.tfevents.1705920588.gpu01-sensors-testing-0.228098.8 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:a6e0af3ed02765154a56599c1710d9ef010a66f85a6df37e6db92f537c1832a8
+size 8270

runs/Jan22_10-53-09_gpu01-sensors-testing-0/events.out.tfevents.1705920792.gpu01-sensors-testing-0.228098.9 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:e03d65679eff5971347d8d72e567bdbaf83722b23c26eb58fdd2a4d8db385d10
+size 8267

runs/Jan22_10-53-36_gpu01-sensors-testing-0/events.out.tfevents.1705920835.gpu01-sensors-testing-0.228098.10 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:f5c2a015edaec2bf924bb18ab6bba20541b0cf8834a0af19484e2a23daa8e211
+size 8264

runs/Jan22_10-55-27_gpu01-sensors-testing-0/events.out.tfevents.1705920930.gpu01-sensors-testing-0.228098.11 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:2741fcbaebe296a017993da16435df1922d5b59a2577a08ae9ff7c248b7486cb
+size 8316

runs/Jan22_11-00-18_gpu01-sensors-testing-0/events.out.tfevents.1705921225.gpu01-sensors-testing-0.229126.0 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:2f77e641303902b5dc1cf09e03bc8f2d115f2f602d0b0da038f766e9ca3bacc1
+size 8312

runs/Jan22_11-04-09_gpu01-sensors-testing-0/events.out.tfevents.1705921450.gpu01-sensors-testing-0.229422.0 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:5af49fa5e935e53c4e7c065705c4794517804ee49453983a949a4a6ca84097ce
+size 9027

runs/Jan22_11-04-56_gpu01-sensors-testing-0/events.out.tfevents.1705921500.gpu01-sensors-testing-0.229422.1 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:e119bbe6c23df04fb3a6e252b1a36604bd2c3d3587f31b7dfd6238cc01d6e6bd
+size 22102

special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,4 @@

+{
+  "bos_token": "[BOS]",
+  "pad_token": "[PAD]"
+}

tokenizer.json ADDED Viewed

The diff for this file is too large to render. See raw diff

tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,12 @@

+{
+  "added_tokens_decoder": {},
+  "bos_token": "[BOS]",
+  "clean_up_tokenization_spaces": true,
+  "max_length": 512,
+  "model_max_length": 1000000000000000019884624838656,
+  "pad_token": "[PAD]",
+  "stride": 0,
+  "tokenizer_class": "PreTrainedTokenizerFast",
+  "truncation_side": "right",
+  "truncation_strategy": "longest_first"
+}

training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:519ccf9d08aa9fe0f6cdb7f59ea53333b5aab4283fe70fedabf675b6c77c4190
+size 4411