SungmoKim committed on Mar 28, 2024

Commit

e1946ac

verified ·

1 Parent(s): 68068f9

Upload folder using huggingface_hub

Browse files

Files changed (24) hide show

.gitattributes +2 -0
README.md +37 -0
autotrain-data/dataset_dict.json +1 -0
autotrain-data/train/data-00000-of-00001.arrow +3 -0
autotrain-data/train/dataset_info.json +0 -0
autotrain-data/train/state.json +16 -0
autotrain-data/validation/data-00000-of-00001.arrow +3 -0
autotrain-data/validation/dataset_info.json +0 -0
autotrain-data/validation/state.json +16 -0
checkpoint-20424/config.json +3 -0
checkpoint-20424/model.safetensors +3 -0
checkpoint-20424/optimizer.pt +3 -0
checkpoint-20424/rng_state.pth +3 -0
checkpoint-20424/scheduler.pt +3 -0
checkpoint-20424/trainer_state.json +180 -0
checkpoint-20424/training_args.bin +3 -0
config.json +3 -0
model.safetensors +3 -0
special_tokens_map.json +7 -0
tokenizer.json +0 -0
tokenizer_config.json +55 -0
training_args.bin +3 -0
training_params.json +30 -0
vocab.txt +0 -0

.gitattributes CHANGED Viewed

@@ -33,3 +33,5 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
 *.zip filter=lfs diff=lfs merge=lfs -text
 *.zst filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text

 *.zip filter=lfs diff=lfs merge=lfs -text
 *.zst filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text
+checkpoint-20424/config.json filter=lfs diff=lfs merge=lfs -text
+config.json filter=lfs diff=lfs merge=lfs -text

README.md ADDED Viewed

	@@ -0,0 +1,37 @@

+---
+tags:
+- autotrain
+- text-classification
+widget:
+- text: "I love AutoTrain"
+datasets:
+- bert-multilingual-uncased-seoul-mapo/autotrain-data
+---
+
+# Model Trained Using AutoTrain
+
+- Problem type: Text Classification
+
+## Validation Metrics
+loss: 10.881439208984375
+
+f1_macro: 2.0884651199784053e-09
+
+f1_micro: 5.5086301872934264e-05
+
+f1_weighted: 6.068667007649333e-09
+
+precision_macro: 1.0442900828992278e-09
+
+precision_micro: 5.5086301872934264e-05
+
+precision_weighted: 3.034500654036041e-09
+
+recall_macro: 1.895734597156398e-05
+
+recall_micro: 5.5086301872934264e-05
+
+recall_weighted: 5.5086301872934264e-05
+
+accuracy: 5.5086301872934264e-05

autotrain-data/dataset_dict.json ADDED Viewed

	@@ -0,0 +1 @@


+{"splits": ["train", "validation"]}

autotrain-data/train/data-00000-of-00001.arrow ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:8b76d5a1aa24ea9542c3754f1d4457dbbbb0d6e58cc79aa13e0cce907141d8ab
+size 8271144

autotrain-data/train/dataset_info.json ADDED Viewed

The diff for this file is too large to render. See raw diff

autotrain-data/train/state.json ADDED Viewed

	@@ -0,0 +1,16 @@

+{
+  "_data_files": [
+    {
+      "filename": "data-00000-of-00001.arrow"
+    }
+  ],
+  "_fingerprint": "569b8763400540ba",
+  "_format_columns": [
+    "autotrain_text",
+    "autotrain_label"
+  ],
+  "_format_kwargs": {},
+  "_format_type": null,
+  "_output_all_columns": false,
+  "_split": null
+}

autotrain-data/validation/data-00000-of-00001.arrow ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:8b76d5a1aa24ea9542c3754f1d4457dbbbb0d6e58cc79aa13e0cce907141d8ab
+size 8271144

autotrain-data/validation/dataset_info.json ADDED Viewed

The diff for this file is too large to render. See raw diff

autotrain-data/validation/state.json ADDED Viewed

	@@ -0,0 +1,16 @@

+{
+  "_data_files": [
+    {
+      "filename": "data-00000-of-00001.arrow"
+    }
+  ],
+  "_fingerprint": "569b8763400540ba",
+  "_format_columns": [
+    "autotrain_text",
+    "autotrain_label"
+  ],
+  "_format_kwargs": {},
+  "_format_type": null,
+  "_output_all_columns": false,
+  "_split": null
+}

checkpoint-20424/config.json ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:30bf199832255bf22ab2f4c359bfb505214667765c744ee2cd9a8e1f5770a2ea
+size 10683194

checkpoint-20424/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:68360b3d50798a2eac1a70f0600a4febac2f251cfc9afba03590c2a6ae28dea8
+size 831708216

checkpoint-20424/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:4409deed287097e9e83339f6758b5bf548d3dd87bd9d47c065ceab8c57e4e469
+size 1663537402

checkpoint-20424/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:549cd76df73cadda6b6fc09b8c61f4b8d765a08797ab0e520843b2d26cb59430
+size 14244

checkpoint-20424/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:ad99518938fa647ab0b4173e6e8716de2d3b659f55fd1664b87aaf18be688e2d
+size 1064

checkpoint-20424/trainer_state.json ADDED Viewed

	@@ -0,0 +1,180 @@

+{
+  "best_metric": 10.881439208984375,
+  "best_model_checkpoint": "bert-multilingual-uncased-seoul-mapo\\checkpoint-20424",
+  "epoch": 3.0,
+  "eval_steps": 500,
+  "global_step": 20424,
+  "is_hyper_param_search": false,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 0.2,
+      "grad_norm": 4.823001861572266,
+      "learning_rate": 3.3186490455212925e-05,
+      "loss": 10.8897,
+      "step": 1361
+    },
+    {
+      "epoch": 0.4,
+      "grad_norm": 10.075815200805664,
+      "learning_rate": 4.816658506066047e-05,
+      "loss": 10.9188,
+      "step": 2722
+    },
+    {
+      "epoch": 0.6,
+      "grad_norm": 9.569664001464844,
+      "learning_rate": 4.446439257929384e-05,
+      "loss": 10.9979,
+      "step": 4083
+    },
+    {
+      "epoch": 0.8,
+      "grad_norm": 8.838366508483887,
+      "learning_rate": 4.076220009792721e-05,
+      "loss": 11.0794,
+      "step": 5444
+    },
+    {
+      "epoch": 1.0,
+      "grad_norm": 9.55294418334961,
+      "learning_rate": 3.706000761656058e-05,
+      "loss": 11.0159,
+      "step": 6805
+    },
+    {
+      "epoch": 1.0,
+      "eval_accuracy": 1.8362100624311422e-05,
+      "eval_f1_macro": 6.961806052611587e-10,
+      "eval_f1_micro": 1.8362100624311422e-05,
+      "eval_f1_weighted": 6.743210967228447e-10,
+      "eval_loss": 10.912298202514648,
+      "eval_precision_macro": 3.480966942997426e-10,
+      "eval_precision_micro": 1.8362100624311422e-05,
+      "eval_precision_weighted": 3.371667393373379e-10,
+      "eval_recall_macro": 1.895734597156398e-05,
+      "eval_recall_micro": 1.8362100624311422e-05,
+      "eval_recall_weighted": 1.8362100624311422e-05,
+      "eval_runtime": 5760.3648,
+      "eval_samples_per_second": 9.454,
+      "eval_steps_per_second": 0.591,
+      "step": 6808
+    },
+    {
+      "epoch": 1.2,
+      "grad_norm": 4.205029010772705,
+      "learning_rate": 3.3357815135193955e-05,
+      "loss": 10.918,
+      "step": 8166
+    },
+    {
+      "epoch": 1.4,
+      "grad_norm": 5.503857135772705,
+      "learning_rate": 2.9655622653827325e-05,
+      "loss": 10.907,
+      "step": 9527
+    },
+    {
+      "epoch": 1.6,
+      "grad_norm": 4.5869550704956055,
+      "learning_rate": 2.5953430172460695e-05,
+      "loss": 10.8973,
+      "step": 10888
+    },
+    {
+      "epoch": 1.8,
+      "grad_norm": 8.75169849395752,
+      "learning_rate": 2.2251237691094066e-05,
+      "loss": 10.896,
+      "step": 12249
+    },
+    {
+      "epoch": 2.0,
+      "grad_norm": 8.687349319458008,
+      "learning_rate": 1.8549045209727436e-05,
+      "loss": 10.9367,
+      "step": 13610
+    },
+    {
+      "epoch": 2.0,
+      "eval_accuracy": 0.0006426735218508997,
+      "eval_f1_macro": 2.435111878171352e-08,
+      "eval_f1_micro": 0.0006426735218508997,
+      "eval_f1_weighted": 8.255279664109179e-07,
+      "eval_loss": 10.890863418579102,
+      "eval_precision_macro": 1.218338430049099e-08,
+      "eval_precision_micro": 0.0006426735218508997,
+      "eval_precision_weighted": 4.1302925568823887e-07,
+      "eval_recall_macro": 1.895734597156398e-05,
+      "eval_recall_micro": 0.0006426735218508997,
+      "eval_recall_weighted": 0.0006426735218508997,
+      "eval_runtime": 229.7364,
+      "eval_samples_per_second": 237.054,
+      "eval_steps_per_second": 14.817,
+      "step": 13616
+    },
+    {
+      "epoch": 2.2,
+      "grad_norm": 5.189822673797607,
+      "learning_rate": 1.4846852728360808e-05,
+      "loss": 10.9037,
+      "step": 14971
+    },
+    {
+      "epoch": 2.4,
+      "grad_norm": 4.2194414138793945,
+      "learning_rate": 1.1147380447200914e-05,
+      "loss": 10.8914,
+      "step": 16332
+    },
+    {
+      "epoch": 2.6,
+      "grad_norm": 3.2576804161071777,
+      "learning_rate": 7.445187965834286e-06,
+      "loss": 10.8939,
+      "step": 17693
+    },
+    {
+      "epoch": 2.8,
+      "grad_norm": 3.3207333087921143,
+      "learning_rate": 3.7457156846743925e-06,
+      "loss": 10.8859,
+      "step": 19054
+    },
+    {
+      "epoch": 3.0,
+      "grad_norm": 4.7934651374816895,
+      "learning_rate": 5.440400413470432e-08,
+      "loss": 10.8979,
+      "step": 20415
+    },
+    {
+      "epoch": 3.0,
+      "eval_accuracy": 5.5086301872934264e-05,
+      "eval_f1_macro": 2.0884651199784053e-09,
+      "eval_f1_micro": 5.5086301872934264e-05,
+      "eval_f1_weighted": 6.068667007649333e-09,
+      "eval_loss": 10.881439208984375,
+      "eval_precision_macro": 1.0442900828992278e-09,
+      "eval_precision_micro": 5.5086301872934264e-05,
+      "eval_precision_weighted": 3.034500654036041e-09,
+      "eval_recall_macro": 1.895734597156398e-05,
+      "eval_recall_micro": 5.5086301872934264e-05,
+      "eval_recall_weighted": 5.5086301872934264e-05,
+      "eval_runtime": 229.8136,
+      "eval_samples_per_second": 236.975,
+      "eval_steps_per_second": 14.812,
+      "step": 20424
+    }
+  ],
+  "logging_steps": 1361,
+  "max_steps": 20424,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 3,
+  "save_steps": 500,
+  "total_flos": 1.583647415497728e+16,
+  "train_batch_size": 8,
+  "trial_name": null,
+  "trial_params": null
+}

checkpoint-20424/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:af067aa29cb53eba11342b2bbe220c7f4c9480b4c431468bf3f6d0bb25b0641c
+size 4984

config.json ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:30bf199832255bf22ab2f4c359bfb505214667765c744ee2cd9a8e1f5770a2ea
+size 10683194

model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:68360b3d50798a2eac1a70f0600a4febac2f251cfc9afba03590c2a6ae28dea8
+size 831708216

special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,7 @@

+{
+  "cls_token": "[CLS]",
+  "mask_token": "[MASK]",
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "unk_token": "[UNK]"
+}

tokenizer.json ADDED Viewed

The diff for this file is too large to render. See raw diff

tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,55 @@

+{
+  "added_tokens_decoder": {
+    "0": {
+      "content": "[PAD]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "100": {
+      "content": "[UNK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "101": {
+      "content": "[CLS]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "102": {
+      "content": "[SEP]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "103": {
+      "content": "[MASK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "clean_up_tokenization_spaces": true,
+  "cls_token": "[CLS]",
+  "do_lower_case": true,
+  "mask_token": "[MASK]",
+  "model_max_length": 512,
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "strip_accents": null,
+  "tokenize_chinese_chars": true,
+  "tokenizer_class": "BertTokenizer",
+  "unk_token": "[UNK]"
+}

training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:af067aa29cb53eba11342b2bbe220c7f4c9480b4c431468bf3f6d0bb25b0641c
+size 4984

training_params.json ADDED Viewed

	@@ -0,0 +1,30 @@

+{
+    "data_path": "bert-multilingual-uncased-seoul-mapo/autotrain-data",
+    "model": "google-bert/bert-base-multilingual-uncased",
+    "lr": 5e-05,
+    "epochs": 3,
+    "max_seq_length": 128,
+    "batch_size": 8,
+    "warmup_ratio": 0.1,
+    "gradient_accumulation": 1,
+    "optimizer": "adamw_torch",
+    "scheduler": "linear",
+    "weight_decay": 0.0,
+    "max_grad_norm": 1.0,
+    "seed": 42,
+    "train_split": "train",
+    "valid_split": "validation",
+    "text_column": "autotrain_text",
+    "target_column": "autotrain_label",
+    "logging_steps": -1,
+    "project_name": "bert-multilingual-uncased-seoul-mapo",
+    "auto_find_batch_size": false,
+    "mixed_precision": "fp16",
+    "save_total_limit": 1,
+    "save_strategy": "epoch",
+    "push_to_hub": true,
+    "repo_id": "SungmoKim/bert-multilingual-uncased-seoul-mapo",
+    "evaluation_strategy": "epoch",
+    "username": "SungmoKim",
+    "log": "none"
+}

vocab.txt ADDED Viewed

The diff for this file is too large to render. See raw diff