fpuentes committed
Commit 6c164fe • 1 parent: 8affacd

Training in progress, step 1500

config.json CHANGED
@@ -7,22 +7,21 @@
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
- "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
- "hidden_size": 1024,
+ "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
- "layer_norm_eps": 1e-12,
+ "layer_norm_eps": 1e-05,
  "max_position_embeddings": 514,
  "model_type": "roberta",
- "num_attention_heads": 16,
+ "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 1,
  "position_embedding_type": "absolute",
  "torch_dtype": "float32",
- "transformers_version": "4.25.1",
+ "transformers_version": "4.24.0",
  "type_vocab_size": 1,
  "use_cache": true,
- "vocab_size": 31002
+ "vocab_size": 50265
  }
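The updated config drops `gradient_checkpointing` and moves from large-style to RoBERTa-base-style hyperparameters (hidden size 768, 12 attention heads, the standard 50,265-token byte-level BPE vocabulary). A minimal sanity-check sketch, assuming `transformers` is installed and `path/to/checkpoint` is a placeholder for a local clone of this repo:

```python
# Minimal sketch: verify the updated hyperparameters after pulling this commit.
# "path/to/checkpoint" is a placeholder, not a real repo id.
from transformers import AutoConfig

config = AutoConfig.from_pretrained("path/to/checkpoint")
assert config.hidden_size == 768
assert config.num_attention_heads == 12
assert config.vocab_size == 50265
print(config.model_type)  # roberta
```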
events.out.tfevents.1675021526.turing.3715.0 → events.out.tfevents.1675621105.turing.942264.0 RENAMED
@@ -1,3 +1,3 @@
  version https://git-lfs.github.com/spec/v1
- oid sha256:d1038493fef059d45cb8f30efaeedca4c0fa3d49da4222e5f042315468cf90cb
+ oid sha256:4c4d0b29a87af88921abbc7c91b319bfe532dd747826d11b12e0c0dd1cebc89a
  size 40
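The binary artifacts in this repo are tracked with Git LFS, so the CHANGED/RENAMED diffs here and below touch only the small pointer files (an `oid sha256:` line plus a `size` in bytes), never the binaries themselves. A sketch of verifying a downloaded blob against its pointer hash (the filename comes from the rename above; run from a local clone):

```python
# Sketch: check a downloaded LFS object against the sha256 in its pointer file.
import hashlib

def sha256_of(path: str) -> str:
    h = hashlib.sha256()
    with open(path, "rb") as f:
        for chunk in iter(lambda: f.read(1 << 20), b""):  # stream in 1 MiB chunks
            h.update(chunk)
    return h.hexdigest()

pointer_oid = "4c4d0b29a87af88921abbc7c91b319bfe532dd747826d11b12e0c0dd1cebc89a"
print(sha256_of("events.out.tfevents.1675621105.turing.942264.0") == pointer_oid)
```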
last-checkpoint/config.json CHANGED
@@ -7,22 +7,21 @@
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
- "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
- "hidden_size": 1024,
+ "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
- "layer_norm_eps": 1e-12,
+ "layer_norm_eps": 1e-05,
  "max_position_embeddings": 514,
  "model_type": "roberta",
- "num_attention_heads": 16,
+ "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 1,
  "position_embedding_type": "absolute",
  "torch_dtype": "float32",
- "transformers_version": "4.25.1",
+ "transformers_version": "4.24.0",
  "type_vocab_size": 1,
  "use_cache": true,
- "vocab_size": 31002
+ "vocab_size": 50265
  }
last-checkpoint/merges.txt ADDED
The diff for this file is too large to render. See raw diff
 
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
  version https://git-lfs.github.com/spec/v1
- oid sha256:e554af5d331128c984ad1b13951ca2c1f493a4b58f00f9dd426cc4e4f5c8e902
- size 1274845829
+ oid sha256:778b67aa071ed05f42167ed3e5e86b6dae8ccfa222e2ddaabc7ca96c4f125bcb
+ size 997747845
last-checkpoint/pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
  version https://git-lfs.github.com/spec/v1
- oid sha256:699cf7e95aa4b428b6dcb17ea96d0a494fb5a668588cb15688d1dfa322b651bf
- size 637412409
+ oid sha256:890934702d88a0dd6337ebc6b82e6cf5721b9eacf995d6cf26ca8604fbb86a4c
+ size 498863417
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
  version https://git-lfs.github.com/spec/v1
- oid sha256:350d8425314e155ec159c0e54caa815e16c9d40828c0e9924a6a994aadfbf4b9
- size 14639
+ oid sha256:22df86520474a41b29bc3648b0a45c593feb726c65d968ff4be10a14325dda87
+ size 14575
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
  version https://git-lfs.github.com/spec/v1
- oid sha256:783327ca172834179676ad8d44cd332681cd4b6b75c6ae1ec2a8870e758409a8
+ oid sha256:69f0ca3db667ccea99a40abd479b8edea284c7dd390646a368deb8fde2a0bf56
  size 627
last-checkpoint/special_tokens_map.json ADDED
@@ -0,0 +1,15 @@
+ {
+ "bos_token": "<s>",
+ "cls_token": "<s>",
+ "eos_token": "</s>",
+ "mask_token": {
+ "content": "<mask>",
+ "lstrip": true,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false
+ },
+ "pad_token": "<pad>",
+ "sep_token": "</s>",
+ "unk_token": "<unk>"
+ }
last-checkpoint/tokenizer.json ADDED
The diff for this file is too large to render. See raw diff
 
last-checkpoint/tokenizer_config.json ADDED
@@ -0,0 +1,17 @@
+ {
+ "add_prefix_space": false,
+ "bos_token": "<s>",
+ "cls_token": "<s>",
+ "eos_token": "</s>",
+ "errors": "replace",
+ "mask_token": "<mask>",
+ "max_len": 512,
+ "model_max_length": 512,
+ "name_or_path": "/home/pcjf/CESGA/works/lmodels/models/large",
+ "pad_token": "<pad>",
+ "sep_token": "</s>",
+ "special_tokens_map_file": null,
+ "tokenizer_class": "RobertaTokenizer",
+ "trim_offsets": true,
+ "unk_token": "<unk>"
+ }
last-checkpoint/trainer_state.json CHANGED
@@ -1,100 +1,30 @@
  {
- "best_metric": 7.145984172821045,
- "best_model_checkpoint": "/home/pcjf/CESGA/works/lmodels/models/large/checkpoint-9000",
- "epoch": 8.130066613977645,
- "global_step": 9000,
+ "best_metric": 6.199821949005127,
+ "best_model_checkpoint": "/home/pcjf/CESGA/works/lmodels/models/large/checkpoint-1500",
+ "epoch": 0.215964257915315,
+ "global_step": 1500,
  "is_hyper_param_search": false,
  "is_local_process_zero": true,
  "is_world_process_zero": true,
  "log_history": [
  {
- "epoch": 1.35,
- "learning_rate": 0.00045483288166215,
- "loss": 7.1968,
+ "epoch": 0.22,
+ "learning_rate": 7.840172786177106e-06,
+ "loss": 6.8838,
  "step": 1500
  },
  {
- "epoch": 1.35,
- "eval_loss": 7.1723456382751465,
- "eval_runtime": 109.6198,
- "eval_samples_per_second": 104.835,
- "eval_steps_per_second": 13.109,
+ "epoch": 0.22,
+ "eval_loss": 6.199821949005127,
+ "eval_runtime": 80.1923,
+ "eval_samples_per_second": 226.281,
+ "eval_steps_per_second": 28.294,
  "step": 1500
- },
- {
- "epoch": 2.71,
- "learning_rate": 0.00040966576332429996,
- "loss": 7.1649,
- "step": 3000
- },
- {
- "epoch": 2.71,
- "eval_loss": 7.157505035400391,
- "eval_runtime": 108.8688,
- "eval_samples_per_second": 105.558,
- "eval_steps_per_second": 13.199,
- "step": 3000
- },
- {
- "epoch": 4.07,
- "learning_rate": 0.0003644986449864499,
- "loss": 7.1627,
- "step": 4500
- },
- {
- "epoch": 4.07,
- "eval_loss": 7.15585994720459,
- "eval_runtime": 109.3225,
- "eval_samples_per_second": 105.12,
- "eval_steps_per_second": 13.145,
- "step": 4500
- },
- {
- "epoch": 5.42,
- "learning_rate": 0.00031933152664859985,
- "loss": 7.1568,
- "step": 6000
- },
- {
- "epoch": 5.42,
- "eval_loss": 7.157613754272461,
- "eval_runtime": 108.7319,
- "eval_samples_per_second": 105.691,
- "eval_steps_per_second": 13.216,
- "step": 6000
- },
- {
- "epoch": 6.77,
- "learning_rate": 0.00027416440831074977,
- "loss": 7.1594,
- "step": 7500
- },
- {
- "epoch": 6.77,
- "eval_loss": 7.1492695808410645,
- "eval_runtime": 122.6861,
- "eval_samples_per_second": 93.67,
- "eval_steps_per_second": 11.713,
- "step": 7500
- },
- {
- "epoch": 8.13,
- "learning_rate": 0.00022899728997289974,
- "loss": 7.156,
- "step": 9000
- },
- {
- "epoch": 8.13,
- "eval_loss": 7.145984172821045,
- "eval_runtime": 111.6951,
- "eval_samples_per_second": 102.887,
- "eval_steps_per_second": 12.865,
- "step": 9000
  }
  ],
- "max_steps": 16605,
- "num_train_epochs": 15,
- "total_flos": 4.202170346996529e+17,
+ "max_steps": 6945,
+ "num_train_epochs": 1,
+ "total_flos": 2.248528520339957e+16,
  "trial_name": null,
  "trial_params": null
  }
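The trainer state confirms a restart: the old history (six eval points between steps 1500 and 9000, loss plateauing near 7.15) is replaced by a fresh one-epoch run whose first checkpoint at step 1500 already reaches an eval loss of 6.20. A minimal sketch for pulling the eval curve out of `trainer_state.json` (path relative to a local clone):

```python
# Sketch: extract (step, eval_loss) pairs from a Trainer checkpoint's state file.
import json

with open("last-checkpoint/trainer_state.json") as f:
    state = json.load(f)

evals = [(e["step"], e["eval_loss"]) for e in state["log_history"] if "eval_loss" in e]
print(evals)  # e.g. [(1500, 6.199821949005127)]
print(state["best_metric"], state["best_model_checkpoint"])
```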
last-checkpoint/training_args.bin CHANGED
@@ -1,3 +1,3 @@
  version https://git-lfs.github.com/spec/v1
- oid sha256:6c8cbf8cbcd2df689edcbeb8d33a558e8a91512021cd69e68769dce93442d595
- size 3515
+ oid sha256:8ac315fb6f01a713c35d8bb0bc140e603ae3fc1ed639b8dd43fdc17fa5a664b6
+ size 3451
last-checkpoint/vocab.json ADDED
The diff for this file is too large to render. See raw diff
 
merges.txt CHANGED
The diff for this file is too large to render. See raw diff
 
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
  version https://git-lfs.github.com/spec/v1
- oid sha256:699cf7e95aa4b428b6dcb17ea96d0a494fb5a668588cb15688d1dfa322b651bf
- size 637412409
+ oid sha256:890934702d88a0dd6337ebc6b82e6cf5721b9eacf995d6cf26ca8604fbb86a4c
+ size 498863417
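The model binary shrinks from ~637 MB to ~499 MB, consistent with the move from a 1024-hidden, 16-head layout to RoBERTa-base dimensions in float32. A rough back-of-the-envelope check (the formula approximates a RoBERTa encoder from the new config values and deliberately ignores biases, LayerNorms, and the LM head):

```python
# Rough parameter-count estimate from the new config; an approximation, not
# a value read from the checkpoint.
V, H, L, I, P = 50265, 768, 12, 3072, 514
embeddings = V * H + P * H + H        # token + position + token-type embeddings
per_layer = 4 * H * H + 2 * H * I     # q/k/v/out projections + FFN up/down
params = embeddings + L * per_layer   # ~124M parameters
print(params * 4 / 1e6, "MB float32") # ~496 MB, close to the 498,863,417-byte pointer
```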
events.out.tfevents.1675021708.turing.3779.0 → runs/Feb05_19-18-25_turing/1675621116.2988715/events.out.tfevents.1675621116.turing.942264.2 RENAMED
@@ -1,3 +1,3 @@
  version https://git-lfs.github.com/spec/v1
- oid sha256:41a3986edb4f5b1ebd47f1d95a924a0276b7a6d51c1a727306d6a9102b0e1261
- size 40
+ oid sha256:64433e0512fffedcc9808dc13c2552a1d0628e378a1393a3e8d280019fade8f2
+ size 5579
events.out.tfevents.1675021876.turing.3907.0 → runs/Feb05_19-18-25_turing/events.out.tfevents.1675621116.turing.942264.1 RENAMED
@@ -1,3 +1,3 @@
  version https://git-lfs.github.com/spec/v1
- oid sha256:5fae8754d53b80ee4c1b0ee5802b17e0247a6fa53c691fb9842c2931611a4296
- size 40
+ oid sha256:866688278b7caac7e71346cdddf3f728327008fe07a5c38f6e0ae3f7355eaf1d
+ size 4268
runs/Jan29_20-48-28_turing/1675021713.9660718/events.out.tfevents.1675021713.turing.3779.2 DELETED
@@ -1,3 +0,0 @@
- version https://git-lfs.github.com/spec/v1
- oid sha256:c29ec387e33077a1ee7b926d1a50160a6f8df4c22c40857b26082ca101531453
- size 5617
runs/Jan29_20-48-28_turing/events.out.tfevents.1675021713.turing.3779.1 DELETED
@@ -1,3 +0,0 @@
- version https://git-lfs.github.com/spec/v1
- oid sha256:6e68ff533ed530838828a7c4bb350a275f3cb8f453940d9cd9b7e428c1621019
- size 3906
runs/Jan29_20-51-16_turing/1675021882.0657997/events.out.tfevents.1675021882.turing.3907.2 DELETED
@@ -1,3 +0,0 @@
- version https://git-lfs.github.com/spec/v1
- oid sha256:0ca9e89ce53904409eef3f68013ef63b67fb63775898a5b46e336d2772178087
- size 5617
runs/Jan29_20-51-16_turing/events.out.tfevents.1675021882.turing.3907.1 DELETED
@@ -1,3 +0,0 @@
- version https://git-lfs.github.com/spec/v1
- oid sha256:89fd4db54cb44d24148ee660b09cd2d215ff69c4f141b45ea214ca6657e325b5
- size 6475
special_tokens_map.json ADDED
@@ -0,0 +1,15 @@
+ {
+ "bos_token": "<s>",
+ "cls_token": "<s>",
+ "eos_token": "</s>",
+ "mask_token": {
+ "content": "<mask>",
+ "lstrip": true,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false
+ },
+ "pad_token": "<pad>",
+ "sep_token": "</s>",
+ "unk_token": "<unk>"
+ }
tokenizer.json ADDED
The diff for this file is too large to render. See raw diff
 
tokenizer_config.json ADDED
@@ -0,0 +1,17 @@
+ {
+ "add_prefix_space": false,
+ "bos_token": "<s>",
+ "cls_token": "<s>",
+ "eos_token": "</s>",
+ "errors": "replace",
+ "mask_token": "<mask>",
+ "max_len": 512,
+ "model_max_length": 512,
+ "name_or_path": "/home/pcjf/CESGA/works/lmodels/models/large",
+ "pad_token": "<pad>",
+ "sep_token": "</s>",
+ "special_tokens_map_file": null,
+ "tokenizer_class": "RobertaTokenizer",
+ "trim_offsets": true,
+ "unk_token": "<unk>"
+ }
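With `vocab.json`, `merges.txt`, and the tokenizer JSONs now committed at the repo root, the tokenizer loads without external files. A minimal sketch, with `path/to/checkpoint` again a placeholder for a local clone:

```python
# Sketch: load the byte-level BPE tokenizer shipped in this commit.
from transformers import AutoTokenizer

tok = AutoTokenizer.from_pretrained("path/to/checkpoint")
print(tok.__class__.__name__)       # typically RobertaTokenizerFast (fast wrapper)
print(tok.model_max_length)         # 512
print(tok("Hola mundo").input_ids)  # ids wrapped in <s> ... </s>
```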
training_args.bin CHANGED
@@ -1,3 +1,3 @@
  version https://git-lfs.github.com/spec/v1
- oid sha256:6c8cbf8cbcd2df689edcbeb8d33a558e8a91512021cd69e68769dce93442d595
- size 3515
+ oid sha256:8ac315fb6f01a713c35d8bb0bc140e603ae3fc1ed639b8dd43fdc17fa5a664b6
+ size 3451
vocab.json CHANGED
The diff for this file is too large to render. See raw diff