Training in progress, epoch 1

Files changed (14) hide show

model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:0c84327d2f34d0aabb099e33ec19322ae4e3b524037c27c164a5849098c07c6a
 size 98470112

 version https://git-lfs.github.com/spec/v1
+oid sha256:cd5711eb9721b26e2bbad9e20f9b1cd4ad333964a88ee9c070880583c612eb5e
 size 98470112

run-3/checkpoint-27/config.json ADDED Viewed

+{
+  "_name_or_path": "google/mobilebert-uncased",
+  "architectures": [
+    "MobileBertForSequenceClassification"
+  ],
+  "attention_probs_dropout_prob": 0.1,
+  "classifier_activation": false,
+  "classifier_dropout": null,
+  "embedding_size": 128,
+  "hidden_act": "relu",
+  "hidden_dropout_prob": 0.0,
+  "hidden_size": 512,
+  "initializer_range": 0.02,
+  "intermediate_size": 512,
+  "intra_bottleneck_size": 128,
+  "key_query_shared_bottleneck": true,
+  "layer_norm_eps": 1e-12,
+  "max_position_embeddings": 512,
+  "model_type": "mobilebert",
+  "normalization_type": "no_norm",
+  "num_attention_heads": 4,
+  "num_feedforward_networks": 4,
+  "num_hidden_layers": 24,
+  "pad_token_id": 0,
+  "problem_type": "single_label_classification",
+  "torch_dtype": "float32",
+  "transformers_version": "4.38.2",
+  "trigram_input": true,
+  "true_hidden_size": 128,
+  "type_vocab_size": 2,
+  "use_bottleneck": true,
+  "use_bottleneck_attention": false,
+  "vocab_size": 30522
+}

run-3/checkpoint-27/model.safetensors ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:cd5711eb9721b26e2bbad9e20f9b1cd4ad333964a88ee9c070880583c612eb5e
+size 98470112

run-3/checkpoint-27/optimizer.pt ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:a811ad900e2b1c0eb1245cc2573173081e1f5f6a27c34b2d9d3fd28ec0e03bfa
+size 197593757

run-3/checkpoint-27/rng_state.pth ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:eee7002acb07e4bcc4284d55442289e7e7b48e2654ec232e01365d6ba36cc233
+size 14308

run-3/checkpoint-27/scheduler.pt ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:b0de8e5fdf9f959a0c55c5a4e97ac0a40ec5d7f02acfdb63c0726aeaa91688ff
+size 1064

run-3/checkpoint-27/special_tokens_map.json ADDED Viewed

+{
+  "cls_token": "[CLS]",
+  "mask_token": "[MASK]",
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "unk_token": "[UNK]"
+}

run-3/checkpoint-27/tokenizer.json ADDED Viewed

The diff for this file is too large to render. See raw diff

run-3/checkpoint-27/tokenizer_config.json ADDED Viewed

+{
+  "added_tokens_decoder": {
+    "0": {
+      "content": "[PAD]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "100": {
+      "content": "[UNK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "101": {
+      "content": "[CLS]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "102": {
+      "content": "[SEP]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "103": {
+      "content": "[MASK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "clean_up_tokenization_spaces": true,
+  "cls_token": "[CLS]",
+  "do_lower_case": true,
+  "mask_token": "[MASK]",
+  "model_max_length": 1000000000000000019884624838656,
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "strip_accents": null,
+  "tokenize_chinese_chars": true,
+  "tokenizer_class": "MobileBertTokenizer",
+  "unk_token": "[UNK]"
+}

run-3/checkpoint-27/trainer_state.json ADDED Viewed

+{
+  "best_metric": 0.00286100001416597,
+  "best_model_checkpoint": "mobilebert-uncased-finetuned-cola/run-3/checkpoint-27",
+  "epoch": 1.0,
+  "eval_steps": 500,
+  "global_step": 27,
+  "is_hyper_param_search": true,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 1.0,
+      "eval_loss": 0.7651640176773071,
+      "eval_matthews_correlation": 0.00286100001416597,
+      "eval_runtime": 2.6861,
+      "eval_samples_per_second": 388.297,
+      "eval_steps_per_second": 24.571,
+      "step": 27
+    }
+  ],
+  "logging_steps": 500,
+  "max_steps": 135,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 5,
+  "save_steps": 500,
+  "total_flos": 0,
+  "train_batch_size": 32,
+  "trial_name": null,
+  "trial_params": {
+    "learning_rate": 7.240804873707743e-05,
+    "num_train_epochs": 5,
+    "per_device_train_batch_size": 32,
+    "seed": 26
+  }
+}

run-3/checkpoint-27/training_args.bin ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:36785e41a5c6212d878c92ad6ba2710c2bfea93bb0742241dc2ee9d2b361a3a8
+size 4920

run-3/checkpoint-27/vocab.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

runs/Mar07_08-06-39_49d4a3166cad/events.out.tfevents.1709800099.49d4a3166cad.3288.7 ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:a58d773a6e0a714d6a1bfddbe54e73f1986cef21a3886394099e3b28b547dc06
+size 5534

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:a0926346707a8d66976e74089ae692911018b9e10991497cdb1023e38ec538cc
 size 4920

 version https://git-lfs.github.com/spec/v1
+oid sha256:36785e41a5c6212d878c92ad6ba2710c2bfea93bb0742241dc2ee9d2b361a3a8
 size 4920