model upload

Files changed (9) hide show

README.md +10 -0
config.json +31 -0
model.safetensors +3 -0
special_tokens_map.json +7 -0
tokenizer.json +0 -0
tokenizer_config.json +55 -0
train_log.txt +39 -0
training_args.json +1 -0
vocab.txt +0 -0

README.md ADDED Viewed

	@@ -0,0 +1,10 @@

+## TextAttack Model Card
+This `bert` model was fine-tuned using TextAttack. It was trained
+for 5 epochs with a batch size of 8,
+a maximum sequence length of 512, and an initial learning rate of 3e-05.
+Since this was a classification task, the model was trained with a cross-entropy loss function.
+The best score the model achieved on this task was 0.9466666666666667 (about 94.67%), as measured by
+eval set accuracy, reached after 3 epochs.
+For more information, check out [TextAttack on GitHub](https://github.com/QData/TextAttack).

config.json ADDED Viewed

	@@ -0,0 +1,31 @@

+{
+  "_name_or_path": "bert-base-chinese",
+  "architectures": [
+    "BertForSequenceClassification"
+  ],
+  "attention_probs_dropout_prob": 0.1,
+  "classifier_dropout": null,
+  "directionality": "bidi",
+  "hidden_act": "gelu",
+  "hidden_dropout_prob": 0.1,
+  "hidden_size": 768,
+  "initializer_range": 0.02,
+  "intermediate_size": 3072,
+  "layer_norm_eps": 1e-12,
+  "max_position_embeddings": 512,
+  "model_type": "bert",
+  "num_attention_heads": 12,
+  "num_hidden_layers": 12,
+  "pad_token_id": 0,
+  "pooler_fc_size": 768,
+  "pooler_num_attention_heads": 12,
+  "pooler_num_fc_layers": 3,
+  "pooler_size_per_head": 128,
+  "pooler_type": "first_token_transform",
+  "position_embedding_type": "absolute",
+  "torch_dtype": "float32",
+  "transformers_version": "4.38.1",
+  "type_vocab_size": 2,
+  "use_cache": true,
+  "vocab_size": 21128
+}

model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:ee139e7d8fd966a11632b623124d5c2f63de8a657918524bef18e2cb8bbec066
+size 409100240

special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,7 @@

+{
+  "cls_token": "[CLS]",
+  "mask_token": "[MASK]",
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "unk_token": "[UNK]"
+}

tokenizer.json ADDED Viewed

The diff for this file is too large to render. See raw diff

tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,55 @@

+{
+  "added_tokens_decoder": {
+    "0": {
+      "content": "[PAD]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "100": {
+      "content": "[UNK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "101": {
+      "content": "[CLS]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "102": {
+      "content": "[SEP]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "103": {
+      "content": "[MASK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "clean_up_tokenization_spaces": true,
+  "cls_token": "[CLS]",
+  "do_lower_case": false,
+  "mask_token": "[MASK]",
+  "model_max_length": 512,
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "strip_accents": null,
+  "tokenize_chinese_chars": true,
+  "tokenizer_class": "BertTokenizer",
+  "unk_token": "[UNK]"
+}

train_log.txt ADDED Viewed

	@@ -0,0 +1,39 @@

+Writing logs to ./outputs/2024-02-28-10-23-08-068616/train_log.txt.
+Wrote original training args to ./outputs/2024-02-28-10-23-08-068616/training_args.json.
+***** Running training *****
+  Num examples = 9600
+  Num epochs = 5
+  Num clean epochs = 5
+  Instantaneous batch size per device = 8
+  Total train batch size (w. parallel, distributed & accumulation) = 8
+  Gradient accumulation steps = 1
+  Total optimization steps = 6000
+==========================================================
+Epoch 1
+Running clean epoch 1/5
+Train accuracy: 88.40%
+Eval accuracy: 91.67%
+Best score found. Saved model to ./outputs/2024-02-28-10-23-08-068616/best_model/
+==========================================================
+Epoch 2
+Running clean epoch 2/5
+Train accuracy: 94.80%
+Eval accuracy: 93.67%
+Best score found. Saved model to ./outputs/2024-02-28-10-23-08-068616/best_model/
+==========================================================
+Epoch 3
+Running clean epoch 3/5
+Train accuracy: 97.62%
+Eval accuracy: 94.67%
+Best score found. Saved model to ./outputs/2024-02-28-10-23-08-068616/best_model/
+==========================================================
+Epoch 4
+Running clean epoch 4/5
+Train accuracy: 98.95%
+Eval accuracy: 94.33%
+==========================================================
+Epoch 5
+Running clean epoch 5/5
+Train accuracy: 99.34%
+Eval accuracy: 94.58%
+Wrote README to ./outputs/2024-02-28-10-23-08-068616/README.md.

training_args.json ADDED Viewed

	@@ -0,0 +1 @@

+ {"num_epochs": 5, "num_clean_epochs": 1, "attack_epoch_interval": 1, "early_stopping_epochs": null, "learning_rate": 3e-05, "num_warmup_steps": 500, "weight_decay": 0.01, "per_device_train_batch_size": 8, "per_device_eval_batch_size": 32, "gradient_accumulation_steps": 1, "random_seed": 718, "parallel": false, "load_best_model_at_end": false, "alpha": 1.0, "num_train_adv_examples": -1, "query_budget_train": null, "attack_num_workers_per_device": 1, "output_dir": "./outputs/2024-02-28-10-23-08-068616", "checkpoint_interval_steps": null, "checkpoint_interval_epochs": null, "save_last": true, "log_to_tb": false, "tb_log_dir": null, "log_to_wandb": false, "wandb_project": "textattack", "logging_interval_step": 1}

vocab.txt ADDED Viewed

The diff for this file is too large to render. See raw diff