alexmy2023 committed on Sep 13

Commit

eb331e4

•

1 Parent(s): 634c105

Training in progress, epoch 1

Browse files

Files changed (25) hide show

model.safetensors +1 -1
run-6/checkpoint-214/config.json +25 -0
run-6/checkpoint-214/model.safetensors +3 -0
run-6/checkpoint-214/optimizer.pt +3 -0
run-6/checkpoint-214/rng_state.pth +3 -0
run-6/checkpoint-214/scheduler.pt +3 -0
run-6/checkpoint-214/special_tokens_map.json +7 -0
run-6/checkpoint-214/tokenizer.json +0 -0
run-6/checkpoint-214/tokenizer_config.json +55 -0
run-6/checkpoint-214/trainer_state.json +56 -0
run-6/checkpoint-214/training_args.bin +3 -0
run-6/checkpoint-214/vocab.txt +0 -0
run-7/checkpoint-27/config.json +25 -0
run-7/checkpoint-27/model.safetensors +3 -0
run-7/checkpoint-27/optimizer.pt +3 -0
run-7/checkpoint-27/rng_state.pth +3 -0
run-7/checkpoint-27/scheduler.pt +3 -0
run-7/checkpoint-27/special_tokens_map.json +7 -0
run-7/checkpoint-27/tokenizer.json +0 -0
run-7/checkpoint-27/tokenizer_config.json +55 -0
run-7/checkpoint-27/trainer_state.json +47 -0
run-7/checkpoint-27/training_args.bin +3 -0
run-7/checkpoint-27/vocab.txt +0 -0
runs/Sep12_22-09-35_MiWiFi-RB06-srv/events.out.tfevents.1726202938.MiWiFi-RB06-srv.162912.9 +3 -0
training_args.bin +1 -1

model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:7cfad3114e04d1cd4db5951505cee6c40d891dc09ef4e2ce780fcabf2124e8a7
 size 267832560

 version https://git-lfs.github.com/spec/v1
+oid sha256:9c8765857d50a8b830fb8079aaa684b5f8fd01b10b10cc759929fff742ecb6c3
 size 267832560

run-6/checkpoint-214/config.json ADDED Viewed

	@@ -0,0 +1,25 @@

+{
+  "_name_or_path": "distilbert-base-uncased",
+  "activation": "gelu",
+  "architectures": [
+    "DistilBertForSequenceClassification"
+  ],
+  "attention_dropout": 0.1,
+  "dim": 768,
+  "dropout": 0.1,
+  "hidden_dim": 3072,
+  "initializer_range": 0.02,
+  "max_position_embeddings": 512,
+  "model_type": "distilbert",
+  "n_heads": 12,
+  "n_layers": 6,
+  "pad_token_id": 0,
+  "problem_type": "single_label_classification",
+  "qa_dropout": 0.1,
+  "seq_classif_dropout": 0.2,
+  "sinusoidal_pos_embds": false,
+  "tie_weights_": true,
+  "torch_dtype": "float32",
+  "transformers_version": "4.44.2",
+  "vocab_size": 30522
+}

run-6/checkpoint-214/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:47b0923dc07ceaaa891a8577ec8dbcfc7b960a61c30544c7b7ef4ec041278cb7
+size 267832560

run-6/checkpoint-214/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:012fe11f482b8e10b25227bb7592f2f0c4356a5c3954c68d8b163949c648236f
+size 535727290

run-6/checkpoint-214/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:b1d377e90cb9f666f33b7d17fd2b4689527e86f671e315325b2eed0c9756f96e
+size 14244

run-6/checkpoint-214/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:9e350f154195773c074e2903b3f324bbe9859b67ad2cebc0e691dddae738a653
+size 1064

run-6/checkpoint-214/special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,7 @@

+{
+  "cls_token": "[CLS]",
+  "mask_token": "[MASK]",
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "unk_token": "[UNK]"
+}

run-6/checkpoint-214/tokenizer.json ADDED Viewed

The diff for this file is too large to render. See raw diff

run-6/checkpoint-214/tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,55 @@

+{
+  "added_tokens_decoder": {
+    "0": {
+      "content": "[PAD]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "100": {
+      "content": "[UNK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "101": {
+      "content": "[CLS]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "102": {
+      "content": "[SEP]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "103": {
+      "content": "[MASK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "clean_up_tokenization_spaces": true,
+  "cls_token": "[CLS]",
+  "do_lower_case": true,
+  "mask_token": "[MASK]",
+  "model_max_length": 512,
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "strip_accents": null,
+  "tokenize_chinese_chars": true,
+  "tokenizer_class": "DistilBertTokenizer",
+  "unk_token": "[UNK]"
+}

run-6/checkpoint-214/trainer_state.json ADDED Viewed

	@@ -0,0 +1,56 @@

+{
+  "best_metric": 0.3335704872121122,
+  "best_model_checkpoint": "distilbert-base-uncased-finetuned-cola/run-6/checkpoint-214",
+  "epoch": 2.0,
+  "eval_steps": 500,
+  "global_step": 214,
+  "is_hyper_param_search": true,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 1.0,
+      "eval_loss": 0.5775482058525085,
+      "eval_matthews_correlation": 0.0463559874942472,
+      "eval_runtime": 2.8107,
+      "eval_samples_per_second": 371.088,
+      "eval_steps_per_second": 23.482,
+      "step": 107
+    },
+    {
+      "epoch": 2.0,
+      "eval_loss": 0.794565737247467,
+      "eval_matthews_correlation": 0.3335704872121122,
+      "eval_runtime": 2.7588,
+      "eval_samples_per_second": 378.059,
+      "eval_steps_per_second": 23.923,
+      "step": 214
+    }
+  ],
+  "logging_steps": 500,
+  "max_steps": 214,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 2,
+  "save_steps": 500,
+  "stateful_callbacks": {
+    "TrainerControl": {
+      "args": {
+        "should_epoch_stop": false,
+        "should_evaluate": false,
+        "should_log": false,
+        "should_save": true,
+        "should_training_stop": true
+      },
+      "attributes": {}
+    }
+  },
+  "total_flos": 0,
+  "train_batch_size": 8,
+  "trial_name": null,
+  "trial_params": {
+    "learning_rate": 6.095042624468598e-05,
+    "num_train_epochs": 2,
+    "per_device_train_batch_size": 8,
+    "seed": 4
+  }
+}

run-6/checkpoint-214/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:6b9468710e0720e1ad5cfb9f727a3d9da01565426671f831bd38db2e1c2d3960
+size 5240

run-6/checkpoint-214/vocab.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

run-7/checkpoint-27/config.json ADDED Viewed

	@@ -0,0 +1,25 @@

+{
+  "_name_or_path": "distilbert-base-uncased",
+  "activation": "gelu",
+  "architectures": [
+    "DistilBertForSequenceClassification"
+  ],
+  "attention_dropout": 0.1,
+  "dim": 768,
+  "dropout": 0.1,
+  "hidden_dim": 3072,
+  "initializer_range": 0.02,
+  "max_position_embeddings": 512,
+  "model_type": "distilbert",
+  "n_heads": 12,
+  "n_layers": 6,
+  "pad_token_id": 0,
+  "problem_type": "single_label_classification",
+  "qa_dropout": 0.1,
+  "seq_classif_dropout": 0.2,
+  "sinusoidal_pos_embds": false,
+  "tie_weights_": true,
+  "torch_dtype": "float32",
+  "transformers_version": "4.44.2",
+  "vocab_size": 30522
+}

run-7/checkpoint-27/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:9c8765857d50a8b830fb8079aaa684b5f8fd01b10b10cc759929fff742ecb6c3
+size 267832560

run-7/checkpoint-27/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:ce3a466181067f76100a3c2cef56f367a390083fdbbf256926dfe2cb093ee3fb
+size 535727290

run-7/checkpoint-27/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:be3ce56c68c604afead4d0188f4a7ac8b4808fd673397ba7b2fc9bf31be6c263
+size 14308

run-7/checkpoint-27/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:a545ce26c2f8bfe185f7c6b18bc31dd9e0fe200b2c1eccaedeff762f27b64312
+size 1064

run-7/checkpoint-27/special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,7 @@

+{
+  "cls_token": "[CLS]",
+  "mask_token": "[MASK]",
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "unk_token": "[UNK]"
+}

run-7/checkpoint-27/tokenizer.json ADDED Viewed

The diff for this file is too large to render. See raw diff

run-7/checkpoint-27/tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,55 @@

+{
+  "added_tokens_decoder": {
+    "0": {
+      "content": "[PAD]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "100": {
+      "content": "[UNK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "101": {
+      "content": "[CLS]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "102": {
+      "content": "[SEP]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "103": {
+      "content": "[MASK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "clean_up_tokenization_spaces": true,
+  "cls_token": "[CLS]",
+  "do_lower_case": true,
+  "mask_token": "[MASK]",
+  "model_max_length": 512,
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "strip_accents": null,
+  "tokenize_chinese_chars": true,
+  "tokenizer_class": "DistilBertTokenizer",
+  "unk_token": "[UNK]"
+}

run-7/checkpoint-27/trainer_state.json ADDED Viewed

	@@ -0,0 +1,47 @@

+{
+  "best_metric": 0.0,
+  "best_model_checkpoint": "distilbert-base-uncased-finetuned-cola/run-7/checkpoint-27",
+  "epoch": 1.0,
+  "eval_steps": 500,
+  "global_step": 27,
+  "is_hyper_param_search": true,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 1.0,
+      "eval_loss": 0.588252067565918,
+      "eval_matthews_correlation": 0.0,
+      "eval_runtime": 2.8049,
+      "eval_samples_per_second": 371.854,
+      "eval_steps_per_second": 23.531,
+      "step": 27
+    }
+  ],
+  "logging_steps": 500,
+  "max_steps": 135,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 5,
+  "save_steps": 500,
+  "stateful_callbacks": {
+    "TrainerControl": {
+      "args": {
+        "should_epoch_stop": false,
+        "should_evaluate": false,
+        "should_log": false,
+        "should_save": true,
+        "should_training_stop": false
+      },
+      "attributes": {}
+    }
+  },
+  "total_flos": 0,
+  "train_batch_size": 32,
+  "trial_name": null,
+  "trial_params": {
+    "learning_rate": 3.524526356230851e-05,
+    "num_train_epochs": 5,
+    "per_device_train_batch_size": 32,
+    "seed": 29
+  }
+}

run-7/checkpoint-27/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:b0fa037da5e44e87e909c4a83b8a1e92ddf86f003e3d99a528befa77b42c32bb
+size 5240

run-7/checkpoint-27/vocab.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

runs/Sep12_22-09-35_MiWiFi-RB06-srv/events.out.tfevents.1726202938.MiWiFi-RB06-srv.162912.9 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:f5cf44d91f5fb542dad02ed41f629106ccb8d95cc62d46b279e3f4efbffd7246
+size 5545

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:6b9468710e0720e1ad5cfb9f727a3d9da01565426671f831bd38db2e1c2d3960
 size 5240

 version https://git-lfs.github.com/spec/v1
+oid sha256:b0fa037da5e44e87e909c4a83b8a1e92ddf86f003e3d99a528befa77b42c32bb
 size 5240