imda-lseokmin committed on May 28

Commit

717255d

•

1 Parent(s): 8b4cc20

Upload 159 files

Browse files

Updated with inputs and responses removed

This view is limited to 50 files because it contains too many changes. See raw diff

Files changed (50) hide show

README.md +3 -3
all_results.json +12 -12
checkpoint-1000/config.json +39 -0
checkpoint-1000/generation_config.json +6 -0
checkpoint-1000/merges.txt +0 -0
checkpoint-1000/model.safetensors +3 -0
checkpoint-1000/optimizer.pt +3 -0
checkpoint-1000/rng_state.pth +3 -0
checkpoint-1000/scheduler.pt +3 -0
checkpoint-1000/special_tokens_map.json +5 -0
checkpoint-1000/tokenizer.json +0 -0
checkpoint-1000/tokenizer_config.json +19 -0
checkpoint-1000/trainer_state.json +35 -0
checkpoint-1000/training_args.bin +3 -0
checkpoint-1000/vocab.json +0 -0
checkpoint-1500/config.json +39 -0
checkpoint-1500/generation_config.json +6 -0
checkpoint-1500/merges.txt +0 -0
checkpoint-1500/model.safetensors +3 -0
checkpoint-1500/optimizer.pt +3 -0
checkpoint-1500/rng_state.pth +3 -0
checkpoint-1500/scheduler.pt +3 -0
checkpoint-1500/special_tokens_map.json +5 -0
checkpoint-1500/tokenizer.json +0 -0
checkpoint-1500/tokenizer_config.json +19 -0
checkpoint-1500/trainer_state.json +42 -0
checkpoint-1500/training_args.bin +3 -0
checkpoint-1500/vocab.json +0 -0
checkpoint-2000/config.json +39 -0
checkpoint-2000/generation_config.json +6 -0
checkpoint-2000/merges.txt +0 -0
checkpoint-2000/model.safetensors +3 -0
checkpoint-2000/optimizer.pt +3 -0
checkpoint-2000/rng_state.pth +3 -0
checkpoint-2000/scheduler.pt +3 -0
checkpoint-2000/special_tokens_map.json +5 -0
checkpoint-2000/tokenizer.json +0 -0
checkpoint-2000/tokenizer_config.json +19 -0
checkpoint-2000/trainer_state.json +49 -0
checkpoint-2000/training_args.bin +3 -0
checkpoint-2000/vocab.json +0 -0
checkpoint-2500/config.json +39 -0
checkpoint-2500/generation_config.json +6 -0
checkpoint-2500/merges.txt +0 -0
checkpoint-2500/model.safetensors +3 -0
checkpoint-2500/optimizer.pt +3 -0
checkpoint-2500/rng_state.pth +3 -0
checkpoint-2500/scheduler.pt +3 -0
checkpoint-2500/special_tokens_map.json +5 -0
checkpoint-2500/tokenizer.json +0 -0

README.md CHANGED Viewed

@@ -17,8 +17,8 @@ should probably proofread and complete it, then remove this comment. -->
 This model is a fine-tuned version of [gpt2](https://huggingface.co/gpt2) on an unknown dataset.
 It achieves the following results on the evaluation set:
-- Loss: 3.3880
-- Accuracy: 0.4552
 ## Model description
@@ -43,7 +43,7 @@ The following hyperparameters were used during training:
 - seed: 42
 - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
 - lr_scheduler_type: linear
-- num_epochs: 40.0
 ### Training results

 This model is a fine-tuned version of [gpt2](https://huggingface.co/gpt2) on an unknown dataset.
 It achieves the following results on the evaluation set:
+- Loss: 2.5745
+- Accuracy: 0.4842
 ## Model description
 - seed: 42
 - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
 - lr_scheduler_type: linear
+- num_epochs: 20.0
 ### Training results

all_results.json CHANGED Viewed

@@ -1,16 +1,16 @@
 {
-    "epoch": 40.0,
-    "eval_accuracy": 0.4551971326164875,
-    "eval_loss": 3.3879826068878174,
-    "eval_runtime": 0.6202,
     "eval_samples": 9,
-    "eval_samples_per_second": 14.512,
-    "eval_steps_per_second": 8.062,
-    "perplexity": 29.606164710375456,
-    "total_flos": 2884664033280000.0,
-    "train_loss": 1.075979393115942,
-    "train_runtime": 1098.0309,
     "train_samples": 138,
-    "train_samples_per_second": 5.027,
-    "train_steps_per_second": 2.514
 }

 {
+    "epoch": 20.0,
+    "eval_accuracy": 0.4841968067774519,
+    "eval_loss": 2.5744614601135254,
+    "eval_runtime": 0.6172,
     "eval_samples": 9,
+    "eval_samples_per_second": 14.581,
+    "eval_steps_per_second": 8.101,
+    "perplexity": 13.124247324302939,
+    "total_flos": 1442332016640000.0,
+    "train_loss": 1.6038585939269134,
+    "train_runtime": 546.7087,
     "train_samples": 138,
+    "train_samples_per_second": 5.048,
+    "train_steps_per_second": 2.524
 }

checkpoint-1000/config.json ADDED Viewed

	@@ -0,0 +1,39 @@

+{
+  "_name_or_path": "gpt2",
+  "activation_function": "gelu_new",
+  "architectures": [
+    "GPT2LMHeadModel"
+  ],
+  "attn_pdrop": 0.1,
+  "bos_token_id": 50256,
+  "embd_pdrop": 0.1,
+  "eos_token_id": 50256,
+  "initializer_range": 0.02,
+  "layer_norm_epsilon": 1e-05,
+  "model_type": "gpt2",
+  "n_ctx": 1024,
+  "n_embd": 768,
+  "n_head": 12,
+  "n_inner": null,
+  "n_layer": 12,
+  "n_positions": 1024,
+  "reorder_and_upcast_attn": false,
+  "resid_pdrop": 0.1,
+  "scale_attn_by_inverse_layer_idx": false,
+  "scale_attn_weights": true,
+  "summary_activation": null,
+  "summary_first_dropout": 0.1,
+  "summary_proj_to_labels": true,
+  "summary_type": "cls_index",
+  "summary_use_proj": true,
+  "task_specific_params": {
+    "text-generation": {
+      "do_sample": true,
+      "max_length": 50
+    }
+  },
+  "torch_dtype": "float32",
+  "transformers_version": "4.40.1",
+  "use_cache": true,
+  "vocab_size": 50257
+}

checkpoint-1000/generation_config.json ADDED Viewed

	@@ -0,0 +1,6 @@

+{
+  "_from_model_config": true,
+  "bos_token_id": 50256,
+  "eos_token_id": 50256,
+  "transformers_version": "4.40.1"
+}

checkpoint-1000/merges.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

checkpoint-1000/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:f0a3045c4618f75a91e43e2b4079b4f70ddfea71b549212fe00c8bc207fce25d
+size 497774208

checkpoint-1000/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:a5737a324483690f9aadd907a2e48f602e54024c812e42d2a6c0c28878d67400
+size 995642298

checkpoint-1000/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:fad09794a0db580c98cf06d0ebd5b66e92d3f86f4f7bd4a728e24f1a05467f0c
+size 14244

checkpoint-1000/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:7e4ac6e2694cbb9ef21cdf8af6f8d76becd952779eb03e00001aef172a063804
+size 1064

checkpoint-1000/special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,5 @@

+{
+  "bos_token": "<|endoftext|>",
+  "eos_token": "<|endoftext|>",
+  "unk_token": "<|endoftext|>"
+}

checkpoint-1000/tokenizer.json ADDED Viewed

The diff for this file is too large to render. See raw diff

checkpoint-1000/tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,19 @@

+{
+  "add_prefix_space": false,
+  "added_tokens_decoder": {
+    "50256": {
+      "content": "<|endoftext|>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "bos_token": "<|endoftext|>",
+  "clean_up_tokenization_spaces": true,
+  "eos_token": "<|endoftext|>",
+  "model_max_length": 1024,
+  "tokenizer_class": "GPT2Tokenizer",
+  "unk_token": "<|endoftext|>"
+}

checkpoint-1000/trainer_state.json ADDED Viewed

	@@ -0,0 +1,35 @@

+{
+  "best_metric": null,
+  "best_model_checkpoint": null,
+  "epoch": 14.492753623188406,
+  "eval_steps": 500,
+  "global_step": 1000,
+  "is_hyper_param_search": false,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 7.246376811594203,
+      "grad_norm": 4.941216468811035,
+      "learning_rate": 3.188405797101449e-05,
+      "loss": 1.9657,
+      "step": 500
+    },
+    {
+      "epoch": 14.492753623188406,
+      "grad_norm": 4.604403495788574,
+      "learning_rate": 1.3768115942028985e-05,
+      "loss": 1.4853,
+      "step": 1000
+    }
+  ],
+  "logging_steps": 500,
+  "max_steps": 1380,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 20,
+  "save_steps": 500,
+  "total_flos": 1045168128000000.0,
+  "train_batch_size": 2,
+  "trial_name": null,
+  "trial_params": null
+}

checkpoint-1000/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:d74f83bec7ea349d722f90da656054543e87196b485a7f973f3b2bf816599956
+size 4984

checkpoint-1000/vocab.json ADDED Viewed

The diff for this file is too large to render. See raw diff

checkpoint-1500/config.json ADDED Viewed

	@@ -0,0 +1,39 @@

+{
+  "_name_or_path": "gpt2",
+  "activation_function": "gelu_new",
+  "architectures": [
+    "GPT2LMHeadModel"
+  ],
+  "attn_pdrop": 0.1,
+  "bos_token_id": 50256,
+  "embd_pdrop": 0.1,
+  "eos_token_id": 50256,
+  "initializer_range": 0.02,
+  "layer_norm_epsilon": 1e-05,
+  "model_type": "gpt2",
+  "n_ctx": 1024,
+  "n_embd": 768,
+  "n_head": 12,
+  "n_inner": null,
+  "n_layer": 12,
+  "n_positions": 1024,
+  "reorder_and_upcast_attn": false,
+  "resid_pdrop": 0.1,
+  "scale_attn_by_inverse_layer_idx": false,
+  "scale_attn_weights": true,
+  "summary_activation": null,
+  "summary_first_dropout": 0.1,
+  "summary_proj_to_labels": true,
+  "summary_type": "cls_index",
+  "summary_use_proj": true,
+  "task_specific_params": {
+    "text-generation": {
+      "do_sample": true,
+      "max_length": 50
+    }
+  },
+  "torch_dtype": "float32",
+  "transformers_version": "4.40.1",
+  "use_cache": true,
+  "vocab_size": 50257
+}

checkpoint-1500/generation_config.json ADDED Viewed

	@@ -0,0 +1,6 @@

+{
+  "_from_model_config": true,
+  "bos_token_id": 50256,
+  "eos_token_id": 50256,
+  "transformers_version": "4.40.1"
+}

checkpoint-1500/merges.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

checkpoint-1500/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:9465c3d5498a14eff4afc1070fc554233f943e6eba2aabfc88b7074c1546d081
+size 497774208

checkpoint-1500/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:c260c3ea63415ce78c5ae5ffd403f9bb6e66bdd2d545964a6113f9907db3557f
+size 995642298

checkpoint-1500/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:7a5d0dc6dc976ddb0996d36c9a11fc601fadb39a823112e10d55371b69bb60c8
+size 14244

checkpoint-1500/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:63d73ead489afb0c384edd6841da8cd61a5e9ac39008a9decfd3938022882349
+size 1064

checkpoint-1500/special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,5 @@

+{
+  "bos_token": "<|endoftext|>",
+  "eos_token": "<|endoftext|>",
+  "unk_token": "<|endoftext|>"
+}

checkpoint-1500/tokenizer.json ADDED Viewed

The diff for this file is too large to render. See raw diff

checkpoint-1500/tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,19 @@

+{
+  "add_prefix_space": false,
+  "added_tokens_decoder": {
+    "50256": {
+      "content": "<|endoftext|>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "bos_token": "<|endoftext|>",
+  "clean_up_tokenization_spaces": true,
+  "eos_token": "<|endoftext|>",
+  "model_max_length": 1024,
+  "tokenizer_class": "GPT2Tokenizer",
+  "unk_token": "<|endoftext|>"
+}

checkpoint-1500/trainer_state.json ADDED Viewed

	@@ -0,0 +1,42 @@

+{
+  "best_metric": null,
+  "best_model_checkpoint": null,
+  "epoch": 26.31578947368421,
+  "eval_steps": 500,
+  "global_step": 1500,
+  "is_hyper_param_search": false,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 8.771929824561404,
+      "grad_norm": 5.547207832336426,
+      "learning_rate": 3.9035087719298244e-05,
+      "loss": 2.3503,
+      "step": 500
+    },
+    {
+      "epoch": 17.54385964912281,
+      "grad_norm": 4.723608493804932,
+      "learning_rate": 2.8070175438596492e-05,
+      "loss": 1.6049,
+      "step": 1000
+    },
+    {
+      "epoch": 26.31578947368421,
+      "grad_norm": 3.2716429233551025,
+      "learning_rate": 1.7105263157894737e-05,
+      "loss": 1.1304,
+      "step": 1500
+    }
+  ],
+  "logging_steps": 500,
+  "max_steps": 2280,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 40,
+  "save_steps": 500,
+  "total_flos": 1554165006336000.0,
+  "train_batch_size": 2,
+  "trial_name": null,
+  "trial_params": null
+}

checkpoint-1500/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:13b85d5955db3439393fdb946be63666175d55f4cd4ea26dedcc342dbcf5fbf3
+size 4984

checkpoint-1500/vocab.json ADDED Viewed

The diff for this file is too large to render. See raw diff

checkpoint-2000/config.json ADDED Viewed

	@@ -0,0 +1,39 @@

+{
+  "_name_or_path": "gpt2",
+  "activation_function": "gelu_new",
+  "architectures": [
+    "GPT2LMHeadModel"
+  ],
+  "attn_pdrop": 0.1,
+  "bos_token_id": 50256,
+  "embd_pdrop": 0.1,
+  "eos_token_id": 50256,
+  "initializer_range": 0.02,
+  "layer_norm_epsilon": 1e-05,
+  "model_type": "gpt2",
+  "n_ctx": 1024,
+  "n_embd": 768,
+  "n_head": 12,
+  "n_inner": null,
+  "n_layer": 12,
+  "n_positions": 1024,
+  "reorder_and_upcast_attn": false,
+  "resid_pdrop": 0.1,
+  "scale_attn_by_inverse_layer_idx": false,
+  "scale_attn_weights": true,
+  "summary_activation": null,
+  "summary_first_dropout": 0.1,
+  "summary_proj_to_labels": true,
+  "summary_type": "cls_index",
+  "summary_use_proj": true,
+  "task_specific_params": {
+    "text-generation": {
+      "do_sample": true,
+      "max_length": 50
+    }
+  },
+  "torch_dtype": "float32",
+  "transformers_version": "4.40.1",
+  "use_cache": true,
+  "vocab_size": 50257
+}

checkpoint-2000/generation_config.json ADDED Viewed

	@@ -0,0 +1,6 @@

+{
+  "_from_model_config": true,
+  "bos_token_id": 50256,
+  "eos_token_id": 50256,
+  "transformers_version": "4.40.1"
+}

checkpoint-2000/merges.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

checkpoint-2000/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:cd7e17c6af9f22cfa4ca7a3119ecd8bd5541e2d28313decc3f3afe309eb5261e
+size 497774208

checkpoint-2000/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:f82ecb38a4f52683fa6de7cfdee42793f9bf75dd744b4ab6a417438c6a5a4a07
+size 995642298

checkpoint-2000/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:a068e9171b43c381b4d97aa1db231465651c89decc2318271a0ef4e4f10c63e9
+size 14244

checkpoint-2000/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:76ee29c7de4f93a78f39f2e05dadcee1556b60097ebe2743779eed6c51359032
+size 1064

checkpoint-2000/special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,5 @@

+{
+  "bos_token": "<|endoftext|>",
+  "eos_token": "<|endoftext|>",
+  "unk_token": "<|endoftext|>"
+}

checkpoint-2000/tokenizer.json ADDED Viewed

The diff for this file is too large to render. See raw diff

checkpoint-2000/tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,19 @@

+{
+  "add_prefix_space": false,
+  "added_tokens_decoder": {
+    "50256": {
+      "content": "<|endoftext|>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "bos_token": "<|endoftext|>",
+  "clean_up_tokenization_spaces": true,
+  "eos_token": "<|endoftext|>",
+  "model_max_length": 1024,
+  "tokenizer_class": "GPT2Tokenizer",
+  "unk_token": "<|endoftext|>"
+}

checkpoint-2000/trainer_state.json ADDED Viewed

	@@ -0,0 +1,49 @@

+{
+  "best_metric": null,
+  "best_model_checkpoint": null,
+  "epoch": 35.08771929824562,
+  "eval_steps": 500,
+  "global_step": 2000,
+  "is_hyper_param_search": false,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 8.771929824561404,
+      "grad_norm": 5.547207832336426,
+      "learning_rate": 3.9035087719298244e-05,
+      "loss": 2.3503,
+      "step": 500
+    },
+    {
+      "epoch": 17.54385964912281,
+      "grad_norm": 4.723608493804932,
+      "learning_rate": 2.8070175438596492e-05,
+      "loss": 1.6049,
+      "step": 1000
+    },
+    {
+      "epoch": 26.31578947368421,
+      "grad_norm": 3.2716429233551025,
+      "learning_rate": 1.7105263157894737e-05,
+      "loss": 1.1304,
+      "step": 1500
+    },
+    {
+      "epoch": 35.08771929824562,
+      "grad_norm": 3.1184732913970947,
+      "learning_rate": 6.140350877192982e-06,
+      "loss": 0.8743,
+      "step": 2000
+    }
+  ],
+  "logging_steps": 500,
+  "max_steps": 2280,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 40,
+  "save_steps": 500,
+  "total_flos": 2072045813760000.0,
+  "train_batch_size": 2,
+  "trial_name": null,
+  "trial_params": null
+}

checkpoint-2000/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:13b85d5955db3439393fdb946be63666175d55f4cd4ea26dedcc342dbcf5fbf3
+size 4984

checkpoint-2000/vocab.json ADDED Viewed

The diff for this file is too large to render. See raw diff

checkpoint-2500/config.json ADDED Viewed

	@@ -0,0 +1,39 @@

+{
+  "_name_or_path": "gpt2",
+  "activation_function": "gelu_new",
+  "architectures": [
+    "GPT2LMHeadModel"
+  ],
+  "attn_pdrop": 0.1,
+  "bos_token_id": 50256,
+  "embd_pdrop": 0.1,
+  "eos_token_id": 50256,
+  "initializer_range": 0.02,
+  "layer_norm_epsilon": 1e-05,
+  "model_type": "gpt2",
+  "n_ctx": 1024,
+  "n_embd": 768,
+  "n_head": 12,
+  "n_inner": null,
+  "n_layer": 12,
+  "n_positions": 1024,
+  "reorder_and_upcast_attn": false,
+  "resid_pdrop": 0.1,
+  "scale_attn_by_inverse_layer_idx": false,
+  "scale_attn_weights": true,
+  "summary_activation": null,
+  "summary_first_dropout": 0.1,
+  "summary_proj_to_labels": true,
+  "summary_type": "cls_index",
+  "summary_use_proj": true,
+  "task_specific_params": {
+    "text-generation": {
+      "do_sample": true,
+      "max_length": 50
+    }
+  },
+  "torch_dtype": "float32",
+  "transformers_version": "4.40.1",
+  "use_cache": true,
+  "vocab_size": 50257
+}

checkpoint-2500/generation_config.json ADDED Viewed

	@@ -0,0 +1,6 @@

+{
+  "_from_model_config": true,
+  "bos_token_id": 50256,
+  "eos_token_id": 50256,
+  "transformers_version": "4.40.1"
+}

checkpoint-2500/merges.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

checkpoint-2500/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:b1f8b8fcba4ccf815d73ea20b625c2f4e5815fa47ef8064cf23ea3087a38b496
+size 497774208

checkpoint-2500/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:8ef47719544b224a26bf342e7ed9be404d3369ec46e3b5db4c0075336fcba9cd
+size 995642298

checkpoint-2500/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:1a5aac99db29c70e1aaad7d1c648f0ec39b61bb7344d6cd77050012b5653176f
+size 14244

checkpoint-2500/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:da29dc3e59527e7abe6c76b3ac8afc3b60d6f976044939cf19f47b9a0849a321
+size 1064

checkpoint-2500/special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,5 @@

+{
+  "bos_token": "<|endoftext|>",
+  "eos_token": "<|endoftext|>",
+  "unk_token": "<|endoftext|>"
+}

checkpoint-2500/tokenizer.json ADDED Viewed

The diff for this file is too large to render. See raw diff