fpuentes committed on Jan 15, 2023

Commit

0da3f6f

•

1 Parent(s): 39cec2d

Training in progress, step 500

Browse files

Files changed (35) hide show

config.json +3 -2
runs/Jan11_16-45-27_turing/1673451933.465075/events.out.tfevents.1673451933.turing.162574.1 → events.out.tfevents.1673814853.turing.327173.0 +2 -2
runs/Jan11_16-45-27_turing/events.out.tfevents.1673451933.turing.162574.0 → events.out.tfevents.1673815130.turing.327344.0 +2 -2
events.out.tfevents.1673815472.turing.327590.0 +3 -0
events.out.tfevents.1673818108.turing.328391.0 +3 -0
events.out.tfevents.1673819239.turing.328732.0 +3 -0
last-checkpoint/config.json +3 -2
last-checkpoint/optimizer.pt +2 -2
last-checkpoint/pytorch_model.bin +1 -1
last-checkpoint/rng_state.pth +2 -2
last-checkpoint/scaler.pt +1 -1
last-checkpoint/scheduler.pt +1 -1
last-checkpoint/trainer_state.json +14 -210
last-checkpoint/training_args.bin +2 -2
log.txt +0 -0
merges.txt +0 -0
pytorch_model.bin +1 -1
runs/Jan15_21-34-13_turing/1673814853.9309754/events.out.tfevents.1673814853.turing.327173.2 +3 -0
runs/Jan15_21-34-13_turing/events.out.tfevents.1673814853.turing.327173.1 +3 -0
runs/Jan15_21-38-50_turing/1673815130.6693852/events.out.tfevents.1673815130.turing.327344.2 +3 -0
runs/Jan15_21-38-50_turing/events.out.tfevents.1673815130.turing.327344.1 +3 -0
runs/Jan15_21-44-32_turing/1673815478.7136974/events.out.tfevents.1673815478.turing.327590.2 +3 -0
runs/Jan15_21-44-32_turing/1673816409.4189365/events.out.tfevents.1673816409.turing.327590.3 +3 -0
runs/Jan15_21-44-32_turing/1673816930.061229/events.out.tfevents.1673816930.turing.327590.4 +3 -0
runs/Jan15_21-44-32_turing/1673817441.0883248/events.out.tfevents.1673817441.turing.327590.5 +3 -0
runs/Jan15_21-44-32_turing/events.out.tfevents.1673815478.turing.327590.1 +3 -0
runs/Jan15_22-28-28_turing/1673818114.7901142/events.out.tfevents.1673818114.turing.328391.2 +3 -0
runs/Jan15_22-28-28_turing/events.out.tfevents.1673818114.turing.328391.1 +3 -0
runs/Jan15_22-47-19_turing/1673819245.5556467/events.out.tfevents.1673819245.turing.328732.2 +3 -0
runs/Jan15_22-47-19_turing/events.out.tfevents.1673819245.turing.328732.1 +3 -0
special_tokens_map.json +0 -51
tokenizer.json +0 -348
tokenizer_config.json +0 -64
training_args.bin +2 -2
vocab.json +0 -0

config.json CHANGED Viewed

@@ -1,5 +1,5 @@
 {
-  "_name_or_path": "/home/pcjf/CESGA/works/lmodels/models/tiny",
   "architectures": [
     "RobertaForMaskedLM"
   ],
@@ -7,6 +7,7 @@
   "bos_token_id": 0,
   "classifier_dropout": null,
   "eos_token_id": 2,
   "hidden_act": "gelu",
   "hidden_dropout_prob": 0.1,
   "hidden_size": 768,
@@ -20,7 +21,7 @@
   "pad_token_id": 1,
   "position_embedding_type": "absolute",
   "torch_dtype": "float32",
-  "transformers_version": "4.24.0",
   "type_vocab_size": 1,
   "use_cache": true,
   "vocab_size": 31002

 {
+  "_name_or_path": "bert-fromscratch-galician-tiny",
   "architectures": [
     "RobertaForMaskedLM"
   ],
   "bos_token_id": 0,
   "classifier_dropout": null,
   "eos_token_id": 2,
+  "gradient_checkpointing": false,
   "hidden_act": "gelu",
   "hidden_dropout_prob": 0.1,
   "hidden_size": 768,
   "pad_token_id": 1,
   "position_embedding_type": "absolute",
   "torch_dtype": "float32",
+  "transformers_version": "4.25.1",
   "type_vocab_size": 1,
   "use_cache": true,
   "vocab_size": 31002

runs/Jan11_16-45-27_turing/1673451933.465075/events.out.tfevents.1673451933.turing.162574.1 → events.out.tfevents.1673814853.turing.327173.0 RENAMED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:853f3d8342cbd88d1830b3b8643713bfd6721a824bc6b62817b60974a961aafd
-size 5573

 version https://git-lfs.github.com/spec/v1
+oid sha256:4009989b8e0cef7be20aace5fa38745aac5d2ff88c7c166309e08ece60c96a9c
+size 40

runs/Jan11_16-45-27_turing/events.out.tfevents.1673451933.turing.162574.0 → events.out.tfevents.1673815130.turing.327344.0 RENAMED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:f3a47a08f9b6acf844e52711088889527cb14f8118d384474492de659f9e07bd
-size 10249

 version https://git-lfs.github.com/spec/v1
+oid sha256:866be7fc2228533501f5b8b9fa180f7d858ef77a9d50f4e342bd7ea017618bc2
+size 40

events.out.tfevents.1673815472.turing.327590.0 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:39cf25e830b6100fd4e060886441e90908203afe88847298ca10d88e7ca06126
+size 40

events.out.tfevents.1673818108.turing.328391.0 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:f2a42b6d9bbe66175c42d9b4af1832c8839d77c22a7cd49b4763e082c9936a27
+size 40

events.out.tfevents.1673819239.turing.328732.0 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:689679f8f31b6990b0694391fe5b7f95d3b3f65100b681df78f59dfd5b08b4b2
+size 40

last-checkpoint/config.json CHANGED Viewed

@@ -1,5 +1,5 @@
 {
-  "_name_or_path": "/home/pcjf/CESGA/works/lmodels/models/tiny",
   "architectures": [
     "RobertaForMaskedLM"
   ],
@@ -7,6 +7,7 @@
   "bos_token_id": 0,
   "classifier_dropout": null,
   "eos_token_id": 2,
   "hidden_act": "gelu",
   "hidden_dropout_prob": 0.1,
   "hidden_size": 768,
@@ -20,7 +21,7 @@
   "pad_token_id": 1,
   "position_embedding_type": "absolute",
   "torch_dtype": "float32",
-  "transformers_version": "4.24.0",
   "type_vocab_size": 1,
   "use_cache": true,
   "vocab_size": 31002

 {
+  "_name_or_path": "bert-fromscratch-galician-tiny",
   "architectures": [
     "RobertaForMaskedLM"
   ],
   "bos_token_id": 0,
   "classifier_dropout": null,
   "eos_token_id": 2,
+  "gradient_checkpointing": false,
   "hidden_act": "gelu",
   "hidden_dropout_prob": 0.1,
   "hidden_size": 768,
   "pad_token_id": 1,
   "position_embedding_type": "absolute",
   "torch_dtype": "float32",
+  "transformers_version": "4.25.1",
   "type_vocab_size": 1,
   "use_cache": true,
   "vocab_size": 31002

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:98e8a5b53b2c4d8733fa58155c862d7ad8c8ac19fc17aa2cdbeeecf969876ede
-size 538917701

 version https://git-lfs.github.com/spec/v1
+oid sha256:801c2271d8c5c89f6b75aad292987eb7be01d92eb95b460208b11f44d1aee93b
+size 538943941

last-checkpoint/pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:d3e60aee58bb3002247500f1d529cca009a081ea94dc8ec603e656e128eb6897
 size 269468281

 version https://git-lfs.github.com/spec/v1
+oid sha256:9d0b07c5c7fc85dd0dfb66ea5fe8504c1a41a9ec2a4fb4454228c53a694d2d63
 size 269468281

last-checkpoint/rng_state.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:edb60841f841b5cc624351d65feeef8d0507231bd57b9a057376c854c4c7c2a6
-size 16619

 version https://git-lfs.github.com/spec/v1
+oid sha256:f31436e4edb8722805d32541741dbc8dc71acb0518feee9de1bd1f464719d49b
+size 14575

last-checkpoint/scaler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:353f071a8d028751f6795b6568373c69120c80918dec3e3f3e2c2a824ed27644
 size 557

 version https://git-lfs.github.com/spec/v1
+oid sha256:a3f196a54202bb4ba1220e8c59f42f9cda0702d68ea83147d814c2fb2f36b8f2
 size 557

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:31e6790cf08ba99f982bd0658300f9c41c4317f30f220548bfd4220ffd05d922
 size 627

 version https://git-lfs.github.com/spec/v1
+oid sha256:420e10273b4c605eace81ed700d0fe1224720131ac4e067633f127c39edc0094
 size 627

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,226 +1,30 @@
 {
-  "best_metric": 2.7213306427001953,
-  "best_model_checkpoint": "/home/pcjf/CESGA/works/lmodels/models/tiny/checkpoint-750",
-  "epoch": 4.236765612613406,
-  "global_step": 750,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
   "log_history": [
     {
-      "epoch": 0.28,
-      "learning_rate": 9.717514124293787e-05,
-      "loss": 5.0078,
-      "step": 50
-    },
-    {
-      "epoch": 0.28,
-      "eval_loss": 3.1328039169311523,
-      "eval_runtime": 312.4569,
-      "eval_samples_per_second": 184.566,
-      "eval_steps_per_second": 7.691,
-      "step": 50
-    },
-    {
-      "epoch": 0.56,
-      "learning_rate": 9.43502824858757e-05,
-      "loss": 3.0128,
-      "step": 100
-    },
-    {
-      "epoch": 0.56,
-      "eval_loss": 2.960442304611206,
-      "eval_runtime": 311.919,
-      "eval_samples_per_second": 184.885,
-      "eval_steps_per_second": 7.704,
-      "step": 100
-    },
-    {
-      "epoch": 0.85,
-      "learning_rate": 9.152542372881357e-05,
-      "loss": 2.949,
-      "step": 150
-    },
-    {
-      "epoch": 0.85,
-      "eval_loss": 2.9336485862731934,
-      "eval_runtime": 312.61,
-      "eval_samples_per_second": 184.476,
-      "eval_steps_per_second": 7.687,
-      "step": 150
-    },
-    {
-      "epoch": 1.13,
-      "learning_rate": 8.870056497175142e-05,
-      "loss": 2.9548,
-      "step": 200
-    },
-    {
-      "epoch": 1.13,
-      "eval_loss": 2.925171375274658,
-      "eval_runtime": 312.2872,
-      "eval_samples_per_second": 184.667,
-      "eval_steps_per_second": 7.695,
-      "step": 200
-    },
-    {
-      "epoch": 1.41,
-      "learning_rate": 8.587570621468927e-05,
-      "loss": 2.9239,
-      "step": 250
-    },
-    {
-      "epoch": 1.41,
-      "eval_loss": 2.915585517883301,
-      "eval_runtime": 310.9982,
-      "eval_samples_per_second": 185.432,
-      "eval_steps_per_second": 7.727,
-      "step": 250
-    },
-    {
-      "epoch": 1.69,
-      "learning_rate": 8.305084745762712e-05,
-      "loss": 2.9156,
-      "step": 300
-    },
-    {
-      "epoch": 1.69,
-      "eval_loss": 2.9091334342956543,
-      "eval_runtime": 312.2088,
-      "eval_samples_per_second": 184.713,
-      "eval_steps_per_second": 7.697,
-      "step": 300
-    },
-    {
-      "epoch": 1.98,
-      "learning_rate": 8.022598870056498e-05,
-      "loss": 2.9106,
-      "step": 350
-    },
-    {
-      "epoch": 1.98,
-      "eval_loss": 2.904860019683838,
-      "eval_runtime": 311.9526,
-      "eval_samples_per_second": 184.865,
-      "eval_steps_per_second": 7.703,
-      "step": 350
-    },
-    {
-      "epoch": 2.26,
-      "learning_rate": 7.740112994350283e-05,
-      "loss": 2.9262,
-      "step": 400
-    },
-    {
-      "epoch": 2.26,
-      "eval_loss": 2.898866653442383,
-      "eval_runtime": 312.7381,
-      "eval_samples_per_second": 184.4,
-      "eval_steps_per_second": 7.684,
-      "step": 400
-    },
-    {
-      "epoch": 2.54,
-      "learning_rate": 7.457627118644068e-05,
-      "loss": 2.8997,
-      "step": 450
-    },
-    {
-      "epoch": 2.54,
-      "eval_loss": 2.8944928646087646,
-      "eval_runtime": 312.5703,
-      "eval_samples_per_second": 184.499,
-      "eval_steps_per_second": 7.688,
-      "step": 450
-    },
-    {
-      "epoch": 2.82,
-      "learning_rate": 7.175141242937854e-05,
-      "loss": 2.8892,
       "step": 500
     },
     {
-      "epoch": 2.82,
-      "eval_loss": 2.8732619285583496,
-      "eval_runtime": 314.1308,
-      "eval_samples_per_second": 183.583,
-      "eval_steps_per_second": 7.65,
       "step": 500
-    },
-    {
-      "epoch": 3.11,
-      "learning_rate": 6.892655367231638e-05,
-      "loss": 2.8935,
-      "step": 550
-    },
-    {
-      "epoch": 3.11,
-      "eval_loss": 2.8509020805358887,
-      "eval_runtime": 313.6449,
-      "eval_samples_per_second": 183.867,
-      "eval_steps_per_second": 7.662,
-      "step": 550
-    },
-    {
-      "epoch": 3.39,
-      "learning_rate": 6.610169491525424e-05,
-      "loss": 2.8514,
-      "step": 600
-    },
-    {
-      "epoch": 3.39,
-      "eval_loss": 2.824007034301758,
-      "eval_runtime": 315.311,
-      "eval_samples_per_second": 182.896,
-      "eval_steps_per_second": 7.621,
-      "step": 600
-    },
-    {
-      "epoch": 3.67,
-      "learning_rate": 6.327683615819209e-05,
-      "loss": 2.8312,
-      "step": 650
-    },
-    {
-      "epoch": 3.67,
-      "eval_loss": 2.7931814193725586,
-      "eval_runtime": 312.19,
-      "eval_samples_per_second": 184.724,
-      "eval_steps_per_second": 7.697,
-      "step": 650
-    },
-    {
-      "epoch": 3.95,
-      "learning_rate": 6.045197740112994e-05,
-      "loss": 2.8029,
-      "step": 700
-    },
-    {
-      "epoch": 3.95,
-      "eval_loss": 2.759551525115967,
-      "eval_runtime": 311.5689,
-      "eval_samples_per_second": 185.092,
-      "eval_steps_per_second": 7.713,
-      "step": 700
-    },
-    {
-      "epoch": 4.24,
-      "learning_rate": 5.76271186440678e-05,
-      "loss": 2.7972,
-      "step": 750
-    },
-    {
-      "epoch": 4.24,
-      "eval_loss": 2.7213306427001953,
-      "eval_runtime": 311.178,
-      "eval_samples_per_second": 185.325,
-      "eval_steps_per_second": 7.722,
-      "step": 750
     }
   ],
-  "max_steps": 1770,
   "num_train_epochs": 10,
-  "total_flos": 1.5298122780045043e+17,
   "trial_name": null,
   "trial_params": null
 }

 {
+  "best_metric": 6.109755516052246,
+  "best_model_checkpoint": "/home/pcjf/CESGA/works/lmodels/models/tiny/checkpoint-500",
+  "epoch": 0.4516201874223778,
+  "global_step": 500,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
   "log_history": [
     {
+      "epoch": 0.45,
+      "learning_rate": 9.5483288166215e-05,
+      "loss": 6.7769,
       "step": 500
     },
     {
+      "epoch": 0.45,
+      "eval_loss": 6.109755516052246,
+      "eval_runtime": 33.0039,
+      "eval_samples_per_second": 348.201,
+      "eval_steps_per_second": 43.54,
       "step": 500
     }
   ],
+  "max_steps": 11070,
   "num_train_epochs": 10,
+  "total_flos": 7979100086017440.0,
   "trial_name": null,
   "trial_params": null
 }

last-checkpoint/training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:c2354b21c0eb02b167b9d6057f7fbae73d5ab7eeb327be5d088eb30bf0019608
-size 3451

 version https://git-lfs.github.com/spec/v1
+oid sha256:f76e096e9f1e6ee51628944ab73e15f97c7ed751c3b13429cf3f135d03e06e71
+size 3515

log.txt CHANGED Viewed

The diff for this file is too large to render. See raw diff

merges.txt CHANGED Viewed

The diff for this file is too large to render. See raw diff

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:d3e60aee58bb3002247500f1d529cca009a081ea94dc8ec603e656e128eb6897
 size 269468281

 version https://git-lfs.github.com/spec/v1
+oid sha256:9d0b07c5c7fc85dd0dfb66ea5fe8504c1a41a9ec2a4fb4454228c53a694d2d63
 size 269468281

runs/Jan15_21-34-13_turing/1673814853.9309754/events.out.tfevents.1673814853.turing.327173.2 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:83d99bd48e1e69b39e42e7e7a111f5813a2df37a546fb6bacb892b68cfcab9b8
+size 5588

runs/Jan15_21-34-13_turing/events.out.tfevents.1673814853.turing.327173.1 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:83a30eb94ec311a4244c985461ab9aa705cdf93050fcec6fcfa2cb9c8110aef5
+size 4006

runs/Jan15_21-38-50_turing/1673815130.6693852/events.out.tfevents.1673815130.turing.327344.2 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:d2108c88a320146c9d7c9086b61374f2318936d1e4962ae7c1ead830c839c66e
+size 5588

runs/Jan15_21-38-50_turing/events.out.tfevents.1673815130.turing.327344.1 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:c03b63169eea176cdba36f0a377b01059662552d65be602090a9ddc75c4988e7
+size 4006

runs/Jan15_21-44-32_turing/1673815478.7136974/events.out.tfevents.1673815478.turing.327590.2 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:6fe18d2ad203a2fca17317161706fe1d48ff0bd3d4aa58ddd3786f66ee732e8d
+size 5614

runs/Jan15_21-44-32_turing/1673816409.4189365/events.out.tfevents.1673816409.turing.327590.3 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:eedfc518d3c9ada6bc4edb1d7acdc69eea238eef562fb5983158bd98891c4f3b
+size 5614

runs/Jan15_21-44-32_turing/1673816930.061229/events.out.tfevents.1673816930.turing.327590.4 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:57f199bef9b59b52a88ac347dc0611408be16552cf1407f4e91f9abc3a603155
+size 5614

runs/Jan15_21-44-32_turing/1673817441.0883248/events.out.tfevents.1673817441.turing.327590.5 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:20f47aa4ff22fa3c39e19eef3d8d7f74e15eaad70caed3426c8785c3416f7c57
+size 5614

runs/Jan15_21-44-32_turing/events.out.tfevents.1673815478.turing.327590.1 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:c0db4d4de36b41c4986a5581bd3f70fad45bcc5a1839d9f07ffe3f2039d230f9
+size 16008

runs/Jan15_22-28-28_turing/1673818114.7901142/events.out.tfevents.1673818114.turing.328391.2 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:d5d412669f79ed37eb2b3550ed1f61ef5e7ee18755c70f0a0f013d113466f767
+size 5617

runs/Jan15_22-28-28_turing/events.out.tfevents.1673818114.turing.328391.1 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:83a4f52c4d22249d42aae1a0c4d851ed9e590be0f45b8596b1978a35272eca20
+size 4030

runs/Jan15_22-47-19_turing/1673819245.5556467/events.out.tfevents.1673819245.turing.328732.2 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:9addc809c33f1ed0e2b6e95fb5f0823429ed6463fd572186b9b8ad02a56e1161
+size 5617

runs/Jan15_22-47-19_turing/events.out.tfevents.1673819245.turing.328732.1 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:fbdf618a68f2360da89225b17fe7026187bcdb9635d64cdf9529da8764639fa1
+size 4301

special_tokens_map.json DELETED Viewed

@@ -1,51 +0,0 @@
-{
-  "bos_token": {
-    "content": "<s>",
-    "lstrip": false,
-    "normalized": true,
-    "rstrip": false,
-    "single_word": false
-  },
-  "cls_token": {
-    "content": "<s>",
-    "lstrip": false,
-    "normalized": true,
-    "rstrip": false,
-    "single_word": false
-  },
-  "eos_token": {
-    "content": "</s>",
-    "lstrip": false,
-    "normalized": true,
-    "rstrip": false,
-    "single_word": false
-  },
-  "mask_token": {
-    "content": "<mask>",
-    "lstrip": true,
-    "normalized": true,
-    "rstrip": false,
-    "single_word": false
-  },
-  "pad_token": {
-    "content": "<pad>",
-    "lstrip": false,
-    "normalized": true,
-    "rstrip": false,
-    "single_word": false
-  },
-  "sep_token": {
-    "content": "</s>",
-    "lstrip": false,
-    "normalized": true,
-    "rstrip": false,
-    "single_word": false
-  },
-  "unk_token": {
-    "content": "<unk>",
-    "lstrip": false,
-    "normalized": true,
-    "rstrip": false,
-    "single_word": false
-  }
-}

tokenizer.json DELETED Viewed

@@ -1,348 +0,0 @@
-{
-  "version": "1.0",
-  "truncation": null,
-  "padding": null,
-  "added_tokens": [
-    {
-      "id": 0,
-      "special": true,
-      "content": "<s>",
-      "single_word": false,
-      "lstrip": false,
-      "rstrip": false,
-      "normalized": true
-    },
-    {
-      "id": 1,
-      "special": true,
-      "content": "<pad>",
-      "single_word": false,
-      "lstrip": false,
-      "rstrip": false,
-      "normalized": true
-    },
-    {
-      "id": 2,
-      "special": true,
-      "content": "</s>",
-      "single_word": false,
-      "lstrip": false,
-      "rstrip": false,
-      "normalized": true
-    },
-    {
-      "id": 3,
-      "special": true,
-      "content": "<unk>",
-      "single_word": false,
-      "lstrip": false,
-      "rstrip": false,
-      "normalized": true
-    },
-    {
-      "id": 4,
-      "special": true,
-      "content": "<mask>",
-      "single_word": false,
-      "lstrip": true,
-      "rstrip": false,
-      "normalized": true
-    }
-  ],
-  "normalizer": null,
-  "pre_tokenizer": {
-    "type": "ByteLevel",
-    "add_prefix_space": false,
-    "trim_offsets": true
-  },
-  "post_processor": {
-    "type": "RobertaProcessing",
-    "sep": [
-      "</s>",
-      2
-    ],
-    "cls": [
-      "<s>",
-      0
-    ],
-    "trim_offsets": true,
-    "add_prefix_space": false
-  },
-  "decoder": {
-    "type": "ByteLevel",
-    "add_prefix_space": true,
-    "trim_offsets": true
-  },
-  "model": {
-    "type": "BPE",
-    "dropout": null,
-    "unk_token": null,
-    "continuing_subword_prefix": "",
-    "end_of_word_suffix": "",
-    "fuse_unk": false,
-    "vocab": {
-      "<s>": 0,
-      "<pad>": 1,
-      "</s>": 2,
-      "<unk>": 3,
-      "<mask>": 4,
-      "!": 5,
-      "\"": 6,
-      "#": 7,
-      "$": 8,
-      "%": 9,
-      "&": 10,
-      "'": 11,
-      "(": 12,
-      ")": 13,
-      "*": 14,
-      "+": 15,
-      ",": 16,
-      "-": 17,
-      ".": 18,
-      "/": 19,
-      "0": 20,
-      "1": 21,
-      "2": 22,
-      "3": 23,
-      "4": 24,
-      "5": 25,
-      "6": 26,
-      "7": 27,
-      "8": 28,
-      "9": 29,
-      ":": 30,
-      ";": 31,
-      "<": 32,
-      "=": 33,
-      ">": 34,
-      "?": 35,
-      "@": 36,
-      "A": 37,
-      "B": 38,
-      "C": 39,
-      "D": 40,
-      "E": 41,
-      "F": 42,
-      "G": 43,
-      "H": 44,
-      "I": 45,
-      "J": 46,
-      "K": 47,
-      "L": 48,
-      "M": 49,
-      "N": 50,
-      "O": 51,
-      "P": 52,
-      "Q": 53,
-      "R": 54,
-      "S": 55,
-      "T": 56,
-      "U": 57,
-      "V": 58,
-      "W": 59,
-      "X": 60,
-      "Y": 61,
-      "Z": 62,
-      "[": 63,
-      "\\": 64,
-      "]": 65,
-      "^": 66,
-      "_": 67,
-      "`": 68,
-      "a": 69,
-      "b": 70,
-      "c": 71,
-      "d": 72,
-      "e": 73,
-      "f": 74,
-      "g": 75,
-      "h": 76,
-      "i": 77,
-      "j": 78,
-      "k": 79,
-      "l": 80,
-      "m": 81,
-      "n": 82,
-      "o": 83,
-      "p": 84,
-      "q": 85,
-      "r": 86,
-      "s": 87,
-      "t": 88,
-      "u": 89,
-      "v": 90,
-      "w": 91,
-      "x": 92,
-      "y": 93,
-      "z": 94,
-      "{": 95,
-      "|": 96,
-      "}": 97,
-      "~": 98,
-      "¡": 99,
-      "¢": 100,
-      "£": 101,
-      "¤": 102,
-      "¥": 103,
-      "¦": 104,
-      "§": 105,
-      "¨": 106,
-      "©": 107,
-      "ª": 108,
-      "«": 109,
-      "¬": 110,
-      "®": 111,
-      "¯": 112,
-      "°": 113,
-      "±": 114,
-      "²": 115,
-      "³": 116,
-      "´": 117,
-      "µ": 118,
-      "¶": 119,
-      "·": 120,
-      "¸": 121,
-      "¹": 122,
-      "º": 123,
-      "»": 124,
-      "¼": 125,
-      "½": 126,
-      "¾": 127,
-      "¿": 128,
-      "À": 129,
-      "Á": 130,
-      "Â": 131,
-      "Ã": 132,
-      "Ä": 133,
-      "Å": 134,
-      "Æ": 135,
-      "Ç": 136,
-      "È": 137,
-      "É": 138,
-      "Ê": 139,
-      "Ë": 140,
-      "Ì": 141,
-      "Í": 142,
-      "Î": 143,
-      "Ï": 144,
-      "Ð": 145,
-      "Ñ": 146,
-      "Ò": 147,
-      "Ó": 148,
-      "Ô": 149,
-      "Õ": 150,
-      "Ö": 151,
-      "×": 152,
-      "Ø": 153,
-      "Ù": 154,
-      "Ú": 155,
-      "Û": 156,
-      "Ü": 157,
-      "Ý": 158,
-      "Þ": 159,
-      "ß": 160,
-      "à": 161,
-      "á": 162,
-      "â": 163,
-      "ã": 164,
-      "ä": 165,
-      "å": 166,
-      "æ": 167,
-      "ç": 168,
-      "è": 169,
-      "é": 170,
-      "ê": 171,
-      "ë": 172,
-      "ì": 173,
-      "í": 174,
-      "î": 175,
-      "ï": 176,
-      "ð": 177,
-      "ñ": 178,
-      "ò": 179,
-      "ó": 180,
-      "ô": 181,
-      "õ": 182,
-      "ö": 183,
-      "÷": 184,
-      "ø": 185,
-      "ù": 186,
-      "ú": 187,
-      "û": 188,
-      "ü": 189,
-      "ý": 190,
-      "þ": 191,
-      "ÿ": 192,
-      "Ā": 193,
-      "ā": 194,
-      "Ă": 195,
-      "ă": 196,
-      "Ą": 197,
-      "ą": 198,
-      "Ć": 199,
-      "ć": 200,
-      "Ĉ": 201,
-      "ĉ": 202,
-      "Ċ": 203,
-      "ċ": 204,
-      "Č": 205,
-      "č": 206,
-      "Ď": 207,
-      "ď": 208,
-      "Đ": 209,
-      "đ": 210,
-      "Ē": 211,
-      "ē": 212,
-      "Ĕ": 213,
-      "ĕ": 214,
-      "Ė": 215,
-      "ė": 216,
-      "Ę": 217,
-      "ę": 218,
-      "Ě": 219,
-      "ě": 220,
-      "Ĝ": 221,
-      "ĝ": 222,
-      "Ğ": 223,
-      "ğ": 224,
-      "Ġ": 225,
-      "ġ": 226,
-      "Ģ": 227,
-      "ģ": 228,
-      "Ĥ": 229,
-      "ĥ": 230,
-      "Ħ": 231,
-      "ħ": 232,
-      "Ĩ": 233,
-      "ĩ": 234,
-      "Ī": 235,
-      "ī": 236,
-      "Ĭ": 237,
-      "ĭ": 238,
-      "Į": 239,
-      "į": 240,
-      "İ": 241,
-      "ı": 242,
-      "Ĳ": 243,
-      "ĳ": 244,
-      "Ĵ": 245,
-      "ĵ": 246,
-      "Ķ": 247,
-      "ķ": 248,
-      "ĸ": 249,
-      "Ĺ": 250,
-      "ĺ": 251,
-      "Ļ": 252,
-      "ļ": 253,
-      "Ľ": 254,
-      "ľ": 255,
-      "Ŀ": 256,
-      "ŀ": 257,
-      "Ł": 258,
-      "ł": 259,
-      "Ń": 260
-    },
-    "merges": []
-  }
-}

tokenizer_config.json DELETED Viewed

@@ -1,64 +0,0 @@
-{
-  "add_prefix_space": false,
-  "bos_token": {
-    "__type": "AddedToken",
-    "content": "<s>",
-    "lstrip": false,
-    "normalized": true,
-    "rstrip": false,
-    "single_word": false
-  },
-  "cls_token": {
-    "__type": "AddedToken",
-    "content": "<s>",
-    "lstrip": false,
-    "normalized": true,
-    "rstrip": false,
-    "single_word": false
-  },
-  "eos_token": {
-    "__type": "AddedToken",
-    "content": "</s>",
-    "lstrip": false,
-    "normalized": true,
-    "rstrip": false,
-    "single_word": false
-  },
-  "errors": "replace",
-  "mask_token": {
-    "__type": "AddedToken",
-    "content": "<mask>",
-    "lstrip": true,
-    "normalized": true,
-    "rstrip": false,
-    "single_word": false
-  },
-  "name_or_path": "/home/pcjf/CESGA/works/lmodels/models/tiny",
-  "pad_token": {
-    "__type": "AddedToken",
-    "content": "<pad>",
-    "lstrip": false,
-    "normalized": true,
-    "rstrip": false,
-    "single_word": false
-  },
-  "sep_token": {
-    "__type": "AddedToken",
-    "content": "</s>",
-    "lstrip": false,
-    "normalized": true,
-    "rstrip": false,
-    "single_word": false
-  },
-  "special_tokens_map_file": null,
-  "tokenizer_class": "RobertaTokenizer",
-  "trim_offsets": true,
-  "unk_token": {
-    "__type": "AddedToken",
-    "content": "<unk>",
-    "lstrip": false,
-    "normalized": true,
-    "rstrip": false,
-    "single_word": false
-  }
-}

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:c2354b21c0eb02b167b9d6057f7fbae73d5ab7eeb327be5d088eb30bf0019608
-size 3451

 version https://git-lfs.github.com/spec/v1
+oid sha256:f76e096e9f1e6ee51628944ab73e15f97c7ed751c3b13429cf3f135d03e06e71
+size 3515

vocab.json CHANGED Viewed

The diff for this file is too large to render. See raw diff