LiYuan199701 committed on Apr 30, 2022

Commit

2e7055a

•

1 Parent(s): e8bb525

upload weights and configurations

Browse files

Files changed (34)

checkpoint-1080/config.json +49 -0
checkpoint-1080/optimizer.pt +3 -0
checkpoint-1080/pytorch_model.bin +3 -0
checkpoint-1080/rng_state.pth +3 -0
checkpoint-1080/scheduler.pt +3 -0
checkpoint-1080/special_tokens_map.json +1 -0
checkpoint-1080/tokenizer.json +0 -0
checkpoint-1080/tokenizer_config.json +1 -0
checkpoint-1080/trainer_state.json +37 -0
checkpoint-1080/training_args.bin +3 -0
checkpoint-1080/vocab.txt +0 -0
checkpoint-2160/config.json +49 -0
checkpoint-2160/optimizer.pt +3 -0
checkpoint-2160/pytorch_model.bin +3 -0
checkpoint-2160/rng_state.pth +3 -0
checkpoint-2160/scheduler.pt +3 -0
checkpoint-2160/special_tokens_map.json +1 -0
checkpoint-2160/tokenizer.json +0 -0
checkpoint-2160/tokenizer_config.json +1 -0
checkpoint-2160/trainer_state.json +58 -0
checkpoint-2160/training_args.bin +3 -0
checkpoint-2160/vocab.txt +0 -0
config.json +49 -0
pytorch_model.bin +3 -0
runs/Apr29_23-50-37_90c6c7951fd7/1651276280.2593992/events.out.tfevents.1651276280.90c6c7951fd7.96.1 +3 -0
runs/Apr29_23-50-37_90c6c7951fd7/events.out.tfevents.1651276280.90c6c7951fd7.96.0 +3 -0
runs/Apr30_14-54-10_40d99a3c6b31/1651330485.541449/events.out.tfevents.1651330485.40d99a3c6b31.98.1 +3 -0
runs/Apr30_14-54-10_40d99a3c6b31/events.out.tfevents.1651330485.40d99a3c6b31.98.0 +3 -0
runs/Apr30_14-54-10_40d99a3c6b31/events.out.tfevents.1651331923.40d99a3c6b31.98.2 +3 -0
special_tokens_map.json +1 -0
tokenizer.json +0 -0
tokenizer_config.json +1 -0
training_args.bin +3 -0
vocab.txt +0 -0

checkpoint-1080/config.json ADDED Viewed

	@@ -0,0 +1,49 @@

+{
+  "_name_or_path": "nlptown/bert-base-multilingual-uncased-sentiment",
+  "_num_labels": 5,
+  "architectures": [
+    "BertForSequenceClassification"
+  ],
+  "attention_probs_dropout_prob": 0.1,
+  "classifier_dropout": null,
+  "directionality": "bidi",
+  "finetuning_task": "sentiment-analysis",
+  "hidden_act": "gelu",
+  "hidden_dropout_prob": 0.1,
+  "hidden_size": 768,
+  "id2label": {
+    "0": "1 star",
+    "1": "2 stars",
+    "2": "3 stars",
+    "3": "4 stars",
+    "4": "5 stars"
+  },
+  "initializer_range": 0.02,
+  "intermediate_size": 3072,
+  "label2id": {
+    "1 star": 0,
+    "2 stars": 1,
+    "3 stars": 2,
+    "4 stars": 3,
+    "5 stars": 4
+  },
+  "layer_norm_eps": 1e-12,
+  "max_position_embeddings": 512,
+  "model_type": "bert",
+  "num_attention_heads": 12,
+  "num_hidden_layers": 12,
+  "output_past": true,
+  "pad_token_id": 0,
+  "pooler_fc_size": 768,
+  "pooler_num_attention_heads": 12,
+  "pooler_num_fc_layers": 3,
+  "pooler_size_per_head": 128,
+  "pooler_type": "first_token_transform",
+  "position_embedding_type": "absolute",
+  "problem_type": "single_label_classification",
+  "torch_dtype": "float32",
+  "transformers_version": "4.18.0",
+  "type_vocab_size": 2,
+  "use_cache": true,
+  "vocab_size": 105879
+}

checkpoint-1080/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:f5483221cea18aa6de41aad0179f8d3639b193757287ecb620b0d0962caacd0f
+size 1338998557

checkpoint-1080/pytorch_model.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:d5dbec41d1a8bb6943bfccdc268b25cb8cfca9218a794bd66244da86b909f10c
+size 669512045

checkpoint-1080/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:36c64416ff24aaf168258056af653e4fb212255ee02bd64a9c0a63d5817db3ce
+size 14503

checkpoint-1080/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:3fc0488cc14ab27ea111af8628fc6d1eb243481639112bdd9bea753f481d2716
+size 623

checkpoint-1080/special_tokens_map.json ADDED Viewed

	@@ -0,0 +1 @@


+ {"unk_token": "[UNK]", "sep_token": "[SEP]", "pad_token": "[PAD]", "cls_token": "[CLS]", "mask_token": "[MASK]"}

checkpoint-1080/tokenizer.json ADDED Viewed

The diff for this file is too large to render. See raw diff

checkpoint-1080/tokenizer_config.json ADDED Viewed

	@@ -0,0 +1 @@

+ {"do_lower_case": true, "unk_token": "[UNK]", "sep_token": "[SEP]", "pad_token": "[PAD]", "cls_token": "[CLS]", "mask_token": "[MASK]", "tokenize_chinese_chars": true, "strip_accents": null, "max_len": 512, "special_tokens_map_file": "/root/.cache/huggingface/transformers/ed85e7bfaa7dfcf9924004400478a6426fcab28d3e427960549371a1729115d1.dd8bd9bfd3664b530ea4e645105f557769387b3da9f79bdb55ed556bdd80611d", "name_or_path": "nlptown/bert-base-multilingual-uncased-sentiment", "do_basic_tokenize": true, "never_split": null, "tokenizer_class": "BertTokenizer"}

checkpoint-1080/trainer_state.json ADDED Viewed

	@@ -0,0 +1,37 @@

+{
+  "best_metric": 0.8,
+  "best_model_checkpoint": "bert-base-multilingual-uncased-sentiment-finetuned-mnli/checkpoint-1080",
+  "epoch": 1.0,
+  "global_step": 1080,
+  "is_hyper_param_search": false,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 0.46,
+      "learning_rate": 1.537037037037037e-05,
+      "loss": 0.5815,
+      "step": 500
+    },
+    {
+      "epoch": 0.93,
+      "learning_rate": 1.0740740740740742e-05,
+      "loss": 0.5554,
+      "step": 1000
+    },
+    {
+      "epoch": 1.0,
+      "eval_accuracy": 0.8,
+      "eval_loss": 0.5202942490577698,
+      "eval_runtime": 45.5353,
+      "eval_samples_per_second": 94.872,
+      "eval_steps_per_second": 5.929,
+      "step": 1080
+    }
+  ],
+  "max_steps": 2160,
+  "num_train_epochs": 2,
+  "total_flos": 4546681501777920.0,
+  "trial_name": null,
+  "trial_params": null
+}

checkpoint-1080/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:e7229c590222fc9bc9efd03e17e51ee9a5ac1f46d4c1b2c02aaa6a19d0653824
+size 3119

checkpoint-1080/vocab.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

checkpoint-2160/config.json ADDED Viewed

	@@ -0,0 +1,49 @@

+{
+  "_name_or_path": "nlptown/bert-base-multilingual-uncased-sentiment",
+  "_num_labels": 5,
+  "architectures": [
+    "BertForSequenceClassification"
+  ],
+  "attention_probs_dropout_prob": 0.1,
+  "classifier_dropout": null,
+  "directionality": "bidi",
+  "finetuning_task": "sentiment-analysis",
+  "hidden_act": "gelu",
+  "hidden_dropout_prob": 0.1,
+  "hidden_size": 768,
+  "id2label": {
+    "0": "1 star",
+    "1": "2 stars",
+    "2": "3 stars",
+    "3": "4 stars",
+    "4": "5 stars"
+  },
+  "initializer_range": 0.02,
+  "intermediate_size": 3072,
+  "label2id": {
+    "1 star": 0,
+    "2 stars": 1,
+    "3 stars": 2,
+    "4 stars": 3,
+    "5 stars": 4
+  },
+  "layer_norm_eps": 1e-12,
+  "max_position_embeddings": 512,
+  "model_type": "bert",
+  "num_attention_heads": 12,
+  "num_hidden_layers": 12,
+  "output_past": true,
+  "pad_token_id": 0,
+  "pooler_fc_size": 768,
+  "pooler_num_attention_heads": 12,
+  "pooler_num_fc_layers": 3,
+  "pooler_size_per_head": 128,
+  "pooler_type": "first_token_transform",
+  "position_embedding_type": "absolute",
+  "problem_type": "single_label_classification",
+  "torch_dtype": "float32",
+  "transformers_version": "4.18.0",
+  "type_vocab_size": 2,
+  "use_cache": true,
+  "vocab_size": 105879
+}

checkpoint-2160/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:adba7bc0adbc850fb8b9fedf8305638552e091c1eaeff34ac7a5c6802eb306d0
+size 1338998557

checkpoint-2160/pytorch_model.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:8b44ae25e8c5905075afe489329dbca4231a3cf926aac518dea11636d71c428a
+size 669512045

checkpoint-2160/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:5d62ec236a22ba8d1c9d31a15b4ee302471376c83244b18e7aab5dc50edf0e01
+size 14503

checkpoint-2160/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:8284f52720d68b59a8f5f98069ef36ec78484714c6591a584d0ad6025ead74d3
+size 623

checkpoint-2160/special_tokens_map.json ADDED Viewed

	@@ -0,0 +1 @@


+ {"unk_token": "[UNK]", "sep_token": "[SEP]", "pad_token": "[PAD]", "cls_token": "[CLS]", "mask_token": "[MASK]"}

checkpoint-2160/tokenizer.json ADDED Viewed

The diff for this file is too large to render. See raw diff

checkpoint-2160/tokenizer_config.json ADDED Viewed

	@@ -0,0 +1 @@

checkpoint-2160/trainer_state.json ADDED Viewed

	@@ -0,0 +1,58 @@

+{
+  "best_metric": 0.8,
+  "best_model_checkpoint": "bert-base-multilingual-uncased-sentiment-finetuned-mnli/checkpoint-1080",
+  "epoch": 2.0,
+  "global_step": 2160,
+  "is_hyper_param_search": false,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 0.46,
+      "learning_rate": 1.537037037037037e-05,
+      "loss": 0.5815,
+      "step": 500
+    },
+    {
+      "epoch": 0.93,
+      "learning_rate": 1.0740740740740742e-05,
+      "loss": 0.5554,
+      "step": 1000
+    },
+    {
+      "epoch": 1.0,
+      "eval_accuracy": 0.8,
+      "eval_loss": 0.5202942490577698,
+      "eval_runtime": 45.5353,
+      "eval_samples_per_second": 94.872,
+      "eval_steps_per_second": 5.929,
+      "step": 1080
+    },
+    {
+      "epoch": 1.39,
+      "learning_rate": 6.111111111111112e-06,
+      "loss": 0.4584,
+      "step": 1500
+    },
+    {
+      "epoch": 1.85,
+      "learning_rate": 1.4814814814814815e-06,
+      "loss": 0.4243,
+      "step": 2000
+    },
+    {
+      "epoch": 2.0,
+      "eval_accuracy": 0.7983796296296296,
+      "eval_loss": 0.549648642539978,
+      "eval_runtime": 45.476,
+      "eval_samples_per_second": 94.995,
+      "eval_steps_per_second": 5.937,
+      "step": 2160
+    }
+  ],
+  "max_steps": 2160,
+  "num_train_epochs": 2,
+  "total_flos": 9093363003555840.0,
+  "trial_name": null,
+  "trial_params": null
+}

checkpoint-2160/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:e7229c590222fc9bc9efd03e17e51ee9a5ac1f46d4c1b2c02aaa6a19d0653824
+size 3119

checkpoint-2160/vocab.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

config.json ADDED Viewed

	@@ -0,0 +1,49 @@

+{
+  "_name_or_path": "nlptown/bert-base-multilingual-uncased-sentiment",
+  "_num_labels": 5,
+  "architectures": [
+    "BertForSequenceClassification"
+  ],
+  "attention_probs_dropout_prob": 0.1,
+  "classifier_dropout": null,
+  "directionality": "bidi",
+  "finetuning_task": "sentiment-analysis",
+  "hidden_act": "gelu",
+  "hidden_dropout_prob": 0.1,
+  "hidden_size": 768,
+  "id2label": {
+    "0": "1 star",
+    "1": "2 stars",
+    "2": "3 stars",
+    "3": "4 stars",
+    "4": "5 stars"
+  },
+  "initializer_range": 0.02,
+  "intermediate_size": 3072,
+  "label2id": {
+    "1 star": 0,
+    "2 stars": 1,
+    "3 stars": 2,
+    "4 stars": 3,
+    "5 stars": 4
+  },
+  "layer_norm_eps": 1e-12,
+  "max_position_embeddings": 512,
+  "model_type": "bert",
+  "num_attention_heads": 12,
+  "num_hidden_layers": 12,
+  "output_past": true,
+  "pad_token_id": 0,
+  "pooler_fc_size": 768,
+  "pooler_num_attention_heads": 12,
+  "pooler_num_fc_layers": 3,
+  "pooler_size_per_head": 128,
+  "pooler_type": "first_token_transform",
+  "position_embedding_type": "absolute",
+  "problem_type": "single_label_classification",
+  "torch_dtype": "float32",
+  "transformers_version": "4.18.0",
+  "type_vocab_size": 2,
+  "use_cache": true,
+  "vocab_size": 105879
+}

pytorch_model.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:d5dbec41d1a8bb6943bfccdc268b25cb8cfca9218a794bd66244da86b909f10c
+size 669512045

runs/Apr29_23-50-37_90c6c7951fd7/1651276280.2593992/events.out.tfevents.1651276280.90c6c7951fd7.96.1 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:0351b9919f4d0bb1fe85a67b7d0a9f11be79efc2a96cb170ed0f46736461398a
+size 4958

runs/Apr29_23-50-37_90c6c7951fd7/events.out.tfevents.1651276280.90c6c7951fd7.96.0 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:69e75c5fe5ece6bcf9058ee65c5095685ba066fc1271e0a75943533e3ed0e946
+size 3969

runs/Apr30_14-54-10_40d99a3c6b31/1651330485.541449/events.out.tfevents.1651330485.40d99a3c6b31.98.1 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:5a6819c57d78a5ddcdc945fa67e363baebb5e581f526e5a43c5ff8315506fdf8
+size 4958

runs/Apr30_14-54-10_40d99a3c6b31/events.out.tfevents.1651330485.40d99a3c6b31.98.0 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:8fcab47017d421d7549c97d796991a6acde4546107c06151ea9b94439404b453
+size 5597

runs/Apr30_14-54-10_40d99a3c6b31/events.out.tfevents.1651331923.40d99a3c6b31.98.2 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:10931744be69022e3f157456c1d11083cd640e28d822849f018646c207ca42d4
+size 363

special_tokens_map.json ADDED Viewed

	@@ -0,0 +1 @@


+ {"unk_token": "[UNK]", "sep_token": "[SEP]", "pad_token": "[PAD]", "cls_token": "[CLS]", "mask_token": "[MASK]"}

tokenizer.json ADDED Viewed

The diff for this file is too large to render. See raw diff

tokenizer_config.json ADDED Viewed

	@@ -0,0 +1 @@

training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:e7229c590222fc9bc9efd03e17e51ee9a5ac1f46d4c1b2c02aaa6a19d0653824
+size 3119

vocab.txt ADDED Viewed

The diff for this file is too large to render. See raw diff