umodel upload

Browse files

Files changed (9) hide show

README.md +10 -0
config.json +48 -0
model.safetensors +3 -0
special_tokens_map.json +7 -0
tokenizer.json +0 -0
tokenizer_config.json +57 -0
train_log.txt +29 -0
training_args.json +1 -0
vocab.txt +0 -0

README.md ADDED Viewed

	@@ -0,0 +1,10 @@

+## TextAttack Model Card
+This `albert` model was fine-tuned using TextAttack. The model was fine-tuned
+for 3 epochs with a batch size of 8,
+a maximum sequence length of 512, and an initial learning rate of 3e-05.
+Since this was a classification task, the model was trained with a cross-entropy loss function.
+The best score the model achieved on this task was 0.9022, as measured by the
+eval set accuracy, found after 3 epochs.
+For more information, check out [TextAttack on GitHub](https://github.com/QData/TextAttack).

config.json ADDED Viewed

	@@ -0,0 +1,48 @@

+{
+  "_name_or_path": "uer/albert-base-chinese-cluecorpussmall",
+  "architectures": [
+    "AlbertForSequenceClassification"
+  ],
+  "attention_probs_dropout_prob": 0,
+  "bos_token_id": 2,
+  "classifier_dropout_prob": 0.1,
+  "embedding_size": 128,
+  "eos_token_id": 3,
+  "hidden_act": "relu",
+  "hidden_dropout_prob": 0,
+  "hidden_size": 768,
+  "id2label": {
+    "0": "Mainland China Politics",
+    "1": "HongKong Macau Politics",
+    "2": "International News",
+    "3": "Financial News",
+    "4": "Culture",
+    "5": "Entertainment",
+    "6": "Sports"
+  },
+  "initializer_range": 0.02,
+  "inner_group_num": 1,
+  "intermediate_size": 3072,
+  "label2id": {
+    "Culture": 4,
+    "Entertainment": 5,
+    "Financial News": 3,
+    "HongKong Macau Politics": 1,
+    "International News": 2,
+    "Mainland China Politics": 0,
+    "Sports": 6
+  },
+  "layer_norm_eps": 1e-12,
+  "max_position_embeddings": 512,
+  "model_type": "albert",
+  "num_attention_heads": 12,
+  "num_hidden_groups": 1,
+  "num_hidden_layers": 12,
+  "pad_token_id": 0,
+  "position_embedding_type": "absolute",
+  "tokenizer_class": "BertTokenizer",
+  "torch_dtype": "float32",
+  "transformers_version": "4.38.1",
+  "type_vocab_size": 2,
+  "vocab_size": 21128
+}

model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:9aa68fd503d3639e058a762ad15290026c256db52b8d9825ef550820f434658f
+size 42216828

special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,7 @@

+{
+  "cls_token": "[CLS]",
+  "mask_token": "[MASK]",
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "unk_token": "[UNK]"
+}

tokenizer.json ADDED Viewed

The diff for this file is too large to render. See raw diff

tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,57 @@

+{
+  "added_tokens_decoder": {
+    "0": {
+      "content": "[PAD]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "100": {
+      "content": "[UNK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "101": {
+      "content": "[CLS]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "102": {
+      "content": "[SEP]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "103": {
+      "content": "[MASK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "clean_up_tokenization_spaces": true,
+  "cls_token": "[CLS]",
+  "do_basic_tokenize": true,
+  "do_lower_case": false,
+  "mask_token": "[MASK]",
+  "model_max_length": 512,
+  "never_split": null,
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "strip_accents": null,
+  "tokenize_chinese_chars": true,
+  "tokenizer_class": "BertTokenizer",
+  "unk_token": "[UNK]"
+}

train_log.txt ADDED Viewed

	@@ -0,0 +1,29 @@

+Writing logs to ./outputs/2024-03-01-08-56-39-463700/train_log.txt.
+Wrote original training args to ./outputs/2024-03-01-08-56-39-463700/training_args.json.
+***** Running training *****
+  Num examples = 50000
+  Num epochs = 3
+  Num clean epochs = 3
+  Instantaneous batch size per device = 8
+  Total train batch size (w. parallel, distributed & accumulation) = 8
+  Gradient accumulation steps = 1
+  Total optimization steps = 18750
+==========================================================
+Epoch 1
+Running clean epoch 1/3
+Train accuracy: 83.47%
+Eval accuracy: 86.99%
+Best score found. Saved model to ./outputs/2024-03-01-08-56-39-463700/best_model/
+==========================================================
+Epoch 2
+Running clean epoch 2/3
+Train accuracy: 90.54%
+Eval accuracy: 89.44%
+Best score found. Saved model to ./outputs/2024-03-01-08-56-39-463700/best_model/
+==========================================================
+Epoch 3
+Running clean epoch 3/3
+Train accuracy: 95.00%
+Eval accuracy: 90.22%
+Best score found. Saved model to ./outputs/2024-03-01-08-56-39-463700/best_model/
+Wrote README to ./outputs/2024-03-01-08-56-39-463700/README.md.

training_args.json ADDED Viewed

	@@ -0,0 +1 @@

+ {"num_epochs": 3, "num_clean_epochs": 1, "attack_epoch_interval": 1, "early_stopping_epochs": null, "learning_rate": 3e-05, "num_warmup_steps": 500, "weight_decay": 0.01, "per_device_train_batch_size": 8, "per_device_eval_batch_size": 32, "gradient_accumulation_steps": 1, "random_seed": 718, "parallel": false, "load_best_model_at_end": false, "alpha": 1.0, "num_train_adv_examples": -1, "query_budget_train": null, "attack_num_workers_per_device": 1, "output_dir": "./outputs/2024-03-01-08-56-39-463700", "checkpoint_interval_steps": null, "checkpoint_interval_epochs": null, "save_last": true, "log_to_tb": false, "tb_log_dir": null, "log_to_wandb": false, "wandb_project": "textattack", "logging_interval_step": 1}

vocab.txt ADDED Viewed

The diff for this file is too large to render. See raw diff