Training in progress, step 500, checkpoint

Files changed (10) hide show

last-checkpoint/config.json CHANGED Viewed

@@ -33,7 +33,7 @@
     }
   },
   "torch_dtype": "float32",
-  "transformers_version": "4.44.2",
   "use_cache": true,
   "vocab_size": 50257
 }

     }
   },
   "torch_dtype": "float32",
+  "transformers_version": "4.45.1",
   "use_cache": true,
   "vocab_size": 50257
 }

last-checkpoint/generation_config.json CHANGED Viewed

@@ -2,5 +2,5 @@
   "_from_model_config": true,
   "bos_token_id": 50256,
   "eos_token_id": 50256,
-  "transformers_version": "4.44.2"
 }

   "_from_model_config": true,
   "bos_token_id": 50256,
   "eos_token_id": 50256,
+  "transformers_version": "4.45.1"
 }

last-checkpoint/model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:667bd867027c05d4d7a383ca3cbe77566f0c87e0df9f990aa2c6c361c8e48103
 size 497774208

 version https://git-lfs.github.com/spec/v1
+oid sha256:b94725bfe1566204e151e7f0a68c6d8f245e564efd51c476821b0e42ee6aa397
 size 497774208

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:8a8be1024915d9580d9be98c81eda66e51670b80f40a6c63430fac51ad14d2f5
 size 995642298

 version https://git-lfs.github.com/spec/v1
+oid sha256:9d58a2d63fddfe8d8ac69da051cc41641ffbc97c9c0c4ede54cc429e48b9db0a
 size 995642298

last-checkpoint/rng_state.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:7783ce2b510ebff845afe5faa16d30b45d77fba542f3b0068e3d921d737af067
 size 14244

 version https://git-lfs.github.com/spec/v1
+oid sha256:3006c2e62f2fbd7c9faf809b9b2f9bdfb8379c432374b893703883a883751cd7
 size 14244

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:a628550ca4465bdd919b150d3c25a5f39f8c2d8ec727e285ab3a8278b2af9fa2
 size 1064

 version https://git-lfs.github.com/spec/v1
+oid sha256:4f2c546c6ee20d93648539b1268fb91629fbdbed1298c7ecff35599c084d635f
 size 1064

last-checkpoint/tokenizer.json CHANGED Viewed

The diff for this file is too large to render. See raw diff

last-checkpoint/tokenizer_config.json CHANGED Viewed

@@ -19,7 +19,7 @@
     }
   },
   "bos_token": "<|endoftext|>",
-  "clean_up_tokenization_spaces": true,
   "eos_token": "<|endoftext|>",
   "model_max_length": 1024,
   "pad_token": "[PAD]",

     }
   },
   "bos_token": "<|endoftext|>",
+  "clean_up_tokenization_spaces": false,
   "eos_token": "<|endoftext|>",
   "model_max_length": 1024,
   "pad_token": "[PAD]",

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,15 +1,15 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 0.46513023646621054,
   "eval_steps": 500,
-  "global_step": 15500,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
   "log_history": [],
-  "logging_steps": 33323,
-  "max_steps": 99972,
   "num_input_tokens_seen": 0,
   "num_train_epochs": 3,
   "save_steps": 500,
@@ -25,7 +25,7 @@
       "attributes": {}
     }
   },
-  "total_flos": 3.2400211968e+16,
   "train_batch_size": 32,
   "trial_name": null,
   "trial_params": null

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 0.029865010154103453,
   "eval_steps": 500,
+  "global_step": 500,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
   "log_history": [],
+  "logging_steps": 16741,
+  "max_steps": 50226,
   "num_input_tokens_seen": 0,
   "num_train_epochs": 3,
   "save_steps": 500,
       "attributes": {}
     }
   },
+  "total_flos": 1045168128000000.0,
   "train_batch_size": 32,
   "trial_name": null,
   "trial_params": null

last-checkpoint/training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:588ed685f39e84528f61e069ba254fd7cef9c5061f838bf59aba9ee692ef1d72
 size 5240

 version https://git-lfs.github.com/spec/v1
+oid sha256:c823122689f046e65538558e9b41096b25fc0852caa1598fec53aa2a8a9e23c8
 size 5240