End of training

Browse files

Files changed (11) hide show

last-checkpoint/config.json +0 -36
last-checkpoint/optimizer.pt +0 -3
last-checkpoint/pytorch_model.bin +0 -3
last-checkpoint/rng_state.pth +0 -3
last-checkpoint/scheduler.pt +0 -3
last-checkpoint/special_tokens_map.json +0 -7
last-checkpoint/tokenizer.json +0 -0
last-checkpoint/tokenizer_config.json +0 -17
last-checkpoint/trainer_state.json +0 -70
last-checkpoint/training_args.bin +0 -3
last-checkpoint/vocab.txt +0 -0

last-checkpoint/config.json DELETED Viewed

@@ -1,36 +0,0 @@
-{
-  "_name_or_path": "distilbert-base-multilingual-cased",
-  "activation": "gelu",
-  "architectures": [
-    "DistilBertForSequenceClassification"
-  ],
-  "attention_dropout": 0.1,
-  "dim": 768,
-  "dropout": 0.1,
-  "hidden_dim": 3072,
-  "id2label": {
-    "0": "P",
-    "1": "NEU",
-    "2": "N"
-  },
-  "initializer_range": 0.02,
-  "label2id": {
-    "N": 2,
-    "NEU": 1,
-    "P": 0
-  },
-  "max_position_embeddings": 512,
-  "model_type": "distilbert",
-  "n_heads": 12,
-  "n_layers": 6,
-  "output_past": true,
-  "pad_token_id": 0,
-  "problem_type": "single_label_classification",
-  "qa_dropout": 0.1,
-  "seq_classif_dropout": 0.2,
-  "sinusoidal_pos_embds": false,
-  "tie_weights_": true,
-  "torch_dtype": "float32",
-  "transformers_version": "4.26.0",
-  "vocab_size": 119547
-}

last-checkpoint/optimizer.pt DELETED Viewed

@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:51fd547909c744d1c4427d66de36e3da2a3eef333d9d98213f32cb483df359cb
-size 1082673861

last-checkpoint/pytorch_model.bin DELETED Viewed

@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:b90e9d5cf032cd13e38686460511c96592b104a58afb73f03db6edd676e10203
-size 541341997

last-checkpoint/rng_state.pth DELETED Viewed

@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:fa76fe52fd649c3885f94de74fa828974782e09ea5a116494bafe08931499b21
-size 13553

last-checkpoint/scheduler.pt DELETED Viewed

@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:aa65b58ab89e6113985723068f5721b82cd7855ba30b3811b50b5d914c50e528
-size 627

last-checkpoint/special_tokens_map.json DELETED Viewed

@@ -1,7 +0,0 @@
-{
-  "cls_token": "[CLS]",
-  "mask_token": "[MASK]",
-  "pad_token": "[PAD]",
-  "sep_token": "[SEP]",
-  "unk_token": "[UNK]"
-}

last-checkpoint/tokenizer.json DELETED Viewed

The diff for this file is too large to render. See raw diff

last-checkpoint/tokenizer_config.json DELETED Viewed

@@ -1,17 +0,0 @@
-{
-  "cls_token": "[CLS]",
-  "do_lower_case": false,
-  "mask_token": "[MASK]",
-  "max_length": 72,
-  "model_max_length": 512,
-  "name_or_path": "distilbert-base-multilingual-cased",
-  "pad_token": "[PAD]",
-  "padding": "max_length",
-  "sep_token": "[SEP]",
-  "special_tokens_map_file": null,
-  "strip_accents": null,
-  "tokenize_chinese_chars": true,
-  "tokenizer_class": "DistilBertTokenizer",
-  "truncation": true,
-  "unk_token": "[UNK]"
-}

last-checkpoint/trainer_state.json DELETED Viewed

@@ -1,70 +0,0 @@
-{
-  "best_metric": 0.6149801744869822,
-  "best_model_checkpoint": "/Users/fperez/dev/data/spanishclassfier_exp/distilbert-base-multilingual-cased-finetuned-with-spanish-tweets-clf/ep_4-lr_5e-5-msl_72-bs_8/checkpoint-1629",
-  "epoch": 3.0,
-  "global_step": 1629,
-  "is_hyper_param_search": false,
-  "is_local_process_zero": true,
-  "is_world_process_zero": true,
-  "log_history": [
-    {
-      "epoch": 1.0,
-      "learning_rate": 3.7500000000000003e-05,
-      "loss": 1.0168,
-      "step": 543
-    },
-    {
-      "epoch": 1.0,
-      "eval_accuracy": 0.5563234277816171,
-      "eval_f1": 0.501215296189785,
-      "eval_loss": 0.9144431948661804,
-      "eval_precision": 0.5239741651933573,
-      "eval_recall": 0.5251116933847957,
-      "eval_runtime": 45.1011,
-      "eval_samples_per_second": 32.083,
-      "eval_steps_per_second": 1.02,
-      "step": 543
-    },
-    {
-      "epoch": 2.0,
-      "learning_rate": 2.5e-05,
-      "loss": 0.8197,
-      "step": 1086
-    },
-    {
-      "epoch": 2.0,
-      "eval_accuracy": 0.5763648928818245,
-      "eval_f1": 0.5475887277260436,
-      "eval_loss": 0.9133076667785645,
-      "eval_precision": 0.5814651407100622,
-      "eval_recall": 0.5462449051052606,
-      "eval_runtime": 53.0684,
-      "eval_samples_per_second": 27.267,
-      "eval_steps_per_second": 0.867,
-      "step": 1086
-    },
-    {
-      "epoch": 3.0,
-      "learning_rate": 1.25e-05,
-      "loss": 0.5574,
-      "step": 1629
-    },
-    {
-      "epoch": 3.0,
-      "eval_accuracy": 0.6150656530753282,
-      "eval_f1": 0.6149801744869822,
-      "eval_loss": 1.0629427433013916,
-      "eval_precision": 0.6227137668982091,
-      "eval_recall": 0.6112054453996908,
-      "eval_runtime": 42.6747,
-      "eval_samples_per_second": 33.908,
-      "eval_steps_per_second": 1.078,
-      "step": 1629
-    }
-  ],
-  "max_steps": 2172,
-  "num_train_epochs": 4,
-  "total_flos": 242543853074880.0,
-  "trial_name": null,
-  "trial_params": null
-}

last-checkpoint/training_args.bin DELETED Viewed

@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:01afbf37abe3c2d7822792a145a2b3731dedacdc0796249d6a564f36c186545d
-size 3835

last-checkpoint/vocab.txt DELETED Viewed

The diff for this file is too large to render. See raw diff