Pratye committed on Jun 14, 2023

Commit

c14531f

1 Parent(s): d8267c5

Added Model

Browse files

Files changed (28) hide show

.DS_Store +0 -0
checkpoint-2400/config.json +31 -0
checkpoint-2400/generation_config.json +7 -0
checkpoint-2400/merges.txt +0 -0
checkpoint-2400/optimizer.pt +3 -0
checkpoint-2400/pytorch_model.bin +3 -0
checkpoint-2400/rng_state_0.pth +3 -0
checkpoint-2400/rng_state_1.pth +3 -0
checkpoint-2400/scheduler.pt +3 -0
checkpoint-2400/special_tokens_map.json +30 -0
checkpoint-2400/tokenizer_config.json +41 -0
checkpoint-2400/trainer_state.json +0 -0
checkpoint-2400/training_args.bin +3 -0
checkpoint-2400/vocab.json +0 -0
config.json +31 -0
generation_config.json +7 -0
merges.txt +0 -0
pytorch_model.bin +3 -0
runs/.DS_Store +0 -0
runs/Jun14_18-02-25_c6f551d7fa07/1686765879.4060984/events.out.tfevents.1686765879.c6f551d7fa07.136.1 +3 -0
runs/Jun14_18-02-25_c6f551d7fa07/events.out.tfevents.1686765879.c6f551d7fa07.136.0 +3 -0
runs/Jun14_18-06-21_c6f551d7fa07/1686766157.3914363/events.out.tfevents.1686766157.c6f551d7fa07.218.1 +3 -0
runs/Jun14_18-06-21_c6f551d7fa07/events.out.tfevents.1686766157.c6f551d7fa07.218.0 +3 -0
special_tokens_map.json +30 -0
tokenizer_config.json +41 -0
trainer_state.json +0 -0
training_args.bin +3 -0
vocab.json +0 -0

.DS_Store ADDED Viewed

Binary file (6.15 kB). View file

checkpoint-2400/config.json ADDED Viewed

	@@ -0,0 +1,31 @@

+{
+  "_name_or_path": "facebook/opt-350m",
+  "_remove_final_layer_norm": false,
+  "activation_dropout": 0.0,
+  "activation_function": "relu",
+  "architectures": [
+    "OPTForCausalLM"
+  ],
+  "attention_dropout": 0.0,
+  "bos_token_id": 2,
+  "do_layer_norm_before": false,
+  "dropout": 0.1,
+  "enable_bias": true,
+  "eos_token_id": 2,
+  "ffn_dim": 4096,
+  "hidden_size": 1024,
+  "init_std": 0.02,
+  "layer_norm_elementwise_affine": true,
+  "layerdrop": 0.0,
+  "max_position_embeddings": 2048,
+  "model_type": "opt",
+  "num_attention_heads": 16,
+  "num_hidden_layers": 24,
+  "pad_token_id": 1,
+  "prefix": "</s>",
+  "torch_dtype": "float32",
+  "transformers_version": "4.29.2",
+  "use_cache": true,
+  "vocab_size": 50265,
+  "word_embed_proj_dim": 512
+}

checkpoint-2400/generation_config.json ADDED Viewed

	@@ -0,0 +1,7 @@

+{
+  "_from_model_config": true,
+  "bos_token_id": 2,
+  "eos_token_id": 2,
+  "pad_token_id": 1,
+  "transformers_version": "4.29.2"
+}

checkpoint-2400/merges.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

checkpoint-2400/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:7f735452a877c51a28f6b32a1e7f4ed087c09bf68582d5184b1294449faf1f4c
+size 2649787397

checkpoint-2400/pytorch_model.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:0fef194959356bc9fef2fbf5777c2cce858a32a58e35f16f10e682d5684ebdff
+size 1427854113

checkpoint-2400/rng_state_0.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:c34a050aa9cf91490146d6c41a69a5d18e058c61cab6c266953b3676ccb7b71f
+size 15607

checkpoint-2400/rng_state_1.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:df14e931706e56a0d9fc58f4bf0e147333df38b875931d956e87541f373b3585
+size 15607

checkpoint-2400/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:29ad1293b45ff480e438a30a4bbc83945434aa6c5fe88988e2ab4877dc35ad46
+size 627

checkpoint-2400/special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,30 @@

+{
+  "bos_token": {
+    "content": "</s>",
+    "lstrip": false,
+    "normalized": true,
+    "rstrip": false,
+    "single_word": false
+  },
+  "eos_token": {
+    "content": "</s>",
+    "lstrip": false,
+    "normalized": true,
+    "rstrip": false,
+    "single_word": false
+  },
+  "pad_token": {
+    "content": "<pad>",
+    "lstrip": false,
+    "normalized": true,
+    "rstrip": false,
+    "single_word": false
+  },
+  "unk_token": {
+    "content": "</s>",
+    "lstrip": false,
+    "normalized": true,
+    "rstrip": false,
+    "single_word": false
+  }
+}

checkpoint-2400/tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,41 @@

+{
+  "add_bos_token": true,
+  "add_prefix_space": false,
+  "bos_token": {
+    "__type": "AddedToken",
+    "content": "</s>",
+    "lstrip": false,
+    "normalized": true,
+    "rstrip": false,
+    "single_word": false
+  },
+  "clean_up_tokenization_spaces": true,
+  "eos_token": {
+    "__type": "AddedToken",
+    "content": "</s>",
+    "lstrip": false,
+    "normalized": true,
+    "rstrip": false,
+    "single_word": false
+  },
+  "errors": "replace",
+  "model_max_length": 512,
+  "pad_token": {
+    "__type": "AddedToken",
+    "content": "<pad>",
+    "lstrip": false,
+    "normalized": true,
+    "rstrip": false,
+    "single_word": false
+  },
+  "padding_side": "right",
+  "tokenizer_class": "GPT2Tokenizer",
+  "unk_token": {
+    "__type": "AddedToken",
+    "content": "</s>",
+    "lstrip": false,
+    "normalized": true,
+    "rstrip": false,
+    "single_word": false
+  }
+}

checkpoint-2400/trainer_state.json ADDED Viewed

The diff for this file is too large to render. See raw diff

checkpoint-2400/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:3f7b6970f7487ddbe266a78385418ea5da6f6078a40a2a6ad7934f05c77b081e
+size 4091

checkpoint-2400/vocab.json ADDED Viewed

The diff for this file is too large to render. See raw diff

config.json ADDED Viewed

	@@ -0,0 +1,31 @@

+{
+  "_name_or_path": "facebook/opt-350m",
+  "_remove_final_layer_norm": false,
+  "activation_dropout": 0.0,
+  "activation_function": "relu",
+  "architectures": [
+    "OPTForCausalLM"
+  ],
+  "attention_dropout": 0.0,
+  "bos_token_id": 2,
+  "do_layer_norm_before": false,
+  "dropout": 0.1,
+  "enable_bias": true,
+  "eos_token_id": 2,
+  "ffn_dim": 4096,
+  "hidden_size": 1024,
+  "init_std": 0.02,
+  "layer_norm_elementwise_affine": true,
+  "layerdrop": 0.0,
+  "max_position_embeddings": 2048,
+  "model_type": "opt",
+  "num_attention_heads": 16,
+  "num_hidden_layers": 24,
+  "pad_token_id": 1,
+  "prefix": "</s>",
+  "torch_dtype": "float32",
+  "transformers_version": "4.29.2",
+  "use_cache": true,
+  "vocab_size": 50265,
+  "word_embed_proj_dim": 512
+}

generation_config.json ADDED Viewed

	@@ -0,0 +1,7 @@

+{
+  "_from_model_config": true,
+  "bos_token_id": 2,
+  "eos_token_id": 2,
+  "pad_token_id": 1,
+  "transformers_version": "4.29.2"
+}

merges.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

pytorch_model.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:5f9615771b630825d88082144897971ce024f23499a3613f2436d4131556e1d9
+size 1427854113

runs/.DS_Store ADDED Viewed

Binary file (6.15 kB). View file

runs/Jun14_18-02-25_c6f551d7fa07/1686765879.4060984/events.out.tfevents.1686765879.c6f551d7fa07.136.1 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:6a943dd7720fdc64c87ade64c7eb99263685847c6b7be2361001277f3f51acc6
+size 6100

runs/Jun14_18-02-25_c6f551d7fa07/events.out.tfevents.1686765879.c6f551d7fa07.136.0 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:05c92a863db33083b383333b494af4ab0846e3bd8b82e02c34a219243f9b4f39
+size 11994

runs/Jun14_18-06-21_c6f551d7fa07/1686766157.3914363/events.out.tfevents.1686766157.c6f551d7fa07.218.1 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:c505fda6f131780f88c631743845e7cebdc44142d94ce8f4cc8e54988a96c006
+size 6100

runs/Jun14_18-06-21_c6f551d7fa07/events.out.tfevents.1686766157.c6f551d7fa07.218.0 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:5886b54b04efc5a556ef75d16bc55bf8ac462e2c6917d53a0d49249c4f051096
+size 386719

special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,30 @@

+{
+  "bos_token": {
+    "content": "</s>",
+    "lstrip": false,
+    "normalized": true,
+    "rstrip": false,
+    "single_word": false
+  },
+  "eos_token": {
+    "content": "</s>",
+    "lstrip": false,
+    "normalized": true,
+    "rstrip": false,
+    "single_word": false
+  },
+  "pad_token": {
+    "content": "<pad>",
+    "lstrip": false,
+    "normalized": true,
+    "rstrip": false,
+    "single_word": false
+  },
+  "unk_token": {
+    "content": "</s>",
+    "lstrip": false,
+    "normalized": true,
+    "rstrip": false,
+    "single_word": false
+  }
+}

tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,41 @@

+{
+  "add_bos_token": true,
+  "add_prefix_space": false,
+  "bos_token": {
+    "__type": "AddedToken",
+    "content": "</s>",
+    "lstrip": false,
+    "normalized": true,
+    "rstrip": false,
+    "single_word": false
+  },
+  "clean_up_tokenization_spaces": true,
+  "eos_token": {
+    "__type": "AddedToken",
+    "content": "</s>",
+    "lstrip": false,
+    "normalized": true,
+    "rstrip": false,
+    "single_word": false
+  },
+  "errors": "replace",
+  "model_max_length": 512,
+  "pad_token": {
+    "__type": "AddedToken",
+    "content": "<pad>",
+    "lstrip": false,
+    "normalized": true,
+    "rstrip": false,
+    "single_word": false
+  },
+  "padding_side": "right",
+  "tokenizer_class": "GPT2Tokenizer",
+  "unk_token": {
+    "__type": "AddedToken",
+    "content": "</s>",
+    "lstrip": false,
+    "normalized": true,
+    "rstrip": false,
+    "single_word": false
+  }
+}

trainer_state.json ADDED Viewed

The diff for this file is too large to render. See raw diff

training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:3f7b6970f7487ddbe266a78385418ea5da6f6078a40a2a6ad7934f05c77b081e
+size 4091

vocab.json ADDED Viewed

The diff for this file is too large to render. See raw diff