Upload 10 files

Files changed (6) hide show

added_tokens.json CHANGED Viewed

	@@ -1 +1 @@
1	- {"<SEP>": 28998, "<BOS>": 28996, "<PAD>": 28999, "<EOS>": 28997}


1	+ {"<BOS>": 28996, "<SEP>": 28998, "<PAD>": 28999, "<EOS>": 28997}

eval_results_mlm.txt CHANGED Viewed

	@@ -1 +1 @@
1	- perplexity = 11.000638008243978


1	+ perplexity = 47.5140214816094

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:b1af4f0f3524fa8ffd0f6083132bed8a0309bba8f0e4104cfdc66e47101a6ca5
-size 1334625496

 version https://git-lfs.github.com/spec/v1
+oid sha256:f2fbf5dab4a15412f879cef823c7c4640ff99951eadbf6f65cfd3e3376e18a82
+size 1334625493

train_results.txt CHANGED Viewed

@@ -1,11 +1,11 @@
-epoch = 5.0
-init_mem_cpu_alloc_delta = 1159303168
-init_mem_cpu_peaked_delta = 916664320
 init_mem_gpu_alloc_delta = 1335215616
 init_mem_gpu_peaked_delta = 0
-train_mem_cpu_alloc_delta = 29356032
-train_mem_cpu_peaked_delta = 0
 train_mem_gpu_alloc_delta = 4003456000
 train_mem_gpu_peaked_delta = 19106743296
-train_runtime = 393.5719
-train_samples_per_second = 0.978

+epoch = 10.0
+init_mem_cpu_alloc_delta = 1168576512
+init_mem_cpu_peaked_delta = 1323925504
 init_mem_gpu_alloc_delta = 1335215616
 init_mem_gpu_peaked_delta = 0
+train_mem_cpu_alloc_delta = 54071296
+train_mem_cpu_peaked_delta = 356077568
 train_mem_gpu_alloc_delta = 4003456000
 train_mem_gpu_peaked_delta = 19106743296
+train_runtime = 980.3735
+train_samples_per_second = 0.785

trainer_state.json CHANGED Viewed

@@ -1,23 +1,29 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 5.0,
-  "global_step": 385,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
   "log_history": [
     {
-      "epoch": 5.0,
-      "step": 385,
-      "total_flos": 3141206509117440.0,
-      "train_runtime": 393.5719,
-      "train_samples_per_second": 0.978
     }
   ],
-  "max_steps": 385,
-  "num_train_epochs": 5,
-  "total_flos": 3141206509117440.0,
   "trial_name": null,
   "trial_params": null
 }

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 10.0,
+  "global_step": 770,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
   "log_history": [
     {
+      "epoch": 6.49,
+      "learning_rate": 3.506493506493507e-08,
+      "loss": 4.2363,
+      "step": 500
+    },
+    {
+      "epoch": 10.0,
+      "step": 770,
+      "total_flos": 6282413018234880.0,
+      "train_runtime": 980.3735,
+      "train_samples_per_second": 0.785
     }
   ],
+  "max_steps": 770,
+  "num_train_epochs": 10,
+  "total_flos": 6282413018234880.0,
   "trial_name": null,
   "trial_params": null
 }

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:0d6747927314afef61a048408044c8503515955e00c6d9c7bf4bd12f66916167
-size 2351

 version https://git-lfs.github.com/spec/v1
+oid sha256:e4d1f848dbe017c8469705d9ef92d62e3ed52b8479d6f13ba39a024dac0c5229
+size 2415