anamelchor committed on Feb 27, 2024

Commit

eb78cad

•

1 Parent(s): 65d303f

Training in progress, epoch 1

Browse files

Files changed (39) hide show

model.safetensors +1 -1
run-6/checkpoint-27/config.json +25 -0
run-6/checkpoint-27/model.safetensors +3 -0
run-6/checkpoint-27/optimizer.pt +3 -0
run-6/checkpoint-27/rng_state.pth +3 -0
run-6/checkpoint-27/scheduler.pt +3 -0
run-6/checkpoint-27/special_tokens_map.json +7 -0
run-6/checkpoint-27/tokenizer.json +0 -0
run-6/checkpoint-27/tokenizer_config.json +55 -0
run-6/checkpoint-27/trainer_state.json +35 -0
run-6/checkpoint-27/training_args.bin +3 -0
run-6/checkpoint-27/vocab.txt +0 -0
run-8/checkpoint-14/config.json +25 -0
run-8/checkpoint-14/model.safetensors +3 -0
run-8/checkpoint-14/optimizer.pt +3 -0
run-8/checkpoint-14/rng_state.pth +3 -0
run-8/checkpoint-14/scheduler.pt +3 -0
run-8/checkpoint-14/special_tokens_map.json +7 -0
run-8/checkpoint-14/tokenizer.json +0 -0
run-8/checkpoint-14/tokenizer_config.json +55 -0
run-8/checkpoint-14/trainer_state.json +35 -0
run-8/checkpoint-14/training_args.bin +3 -0
run-8/checkpoint-14/vocab.txt +0 -0
run-8/checkpoint-28/config.json +25 -0
run-8/checkpoint-28/model.safetensors +3 -0
run-8/checkpoint-28/optimizer.pt +3 -0
run-8/checkpoint-28/rng_state.pth +3 -0
run-8/checkpoint-28/scheduler.pt +3 -0
run-8/checkpoint-28/special_tokens_map.json +7 -0
run-8/checkpoint-28/tokenizer.json +0 -0
run-8/checkpoint-28/tokenizer_config.json +55 -0
run-8/checkpoint-28/trainer_state.json +44 -0
run-8/checkpoint-28/training_args.bin +3 -0
run-8/checkpoint-28/vocab.txt +0 -0
runs/Feb27_16-43-42_b3bc3fede2ea/events.out.tfevents.1709053090.b3bc3fede2ea.5958.8 +3 -0
runs/Feb27_16-43-42_b3bc3fede2ea/events.out.tfevents.1709053104.b3bc3fede2ea.5958.9 +3 -0
runs/Feb27_16-43-42_b3bc3fede2ea/events.out.tfevents.1709053108.b3bc3fede2ea.5958.10 +3 -0
runs/Feb27_16-43-42_b3bc3fede2ea/events.out.tfevents.1709053201.b3bc3fede2ea.5958.11 +3 -0
training_args.bin +1 -1

model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:7b7264777c389cb61e3202e49cd712d6a0a7c71278279effc9d1901b3bd91bac
+oid sha256:05c6915b26fda6049e2fdb28bf64c10c7914ec7d20afb33eca758b8a496e19c2
 size 267832560

run-6/checkpoint-27/config.json ADDED Viewed

	@@ -0,0 +1,25 @@

+{
+  "_name_or_path": "distilbert-base-uncased",
+  "activation": "gelu",
+  "architectures": [
+    "DistilBertForSequenceClassification"
+  ],
+  "attention_dropout": 0.1,
+  "dim": 768,
+  "dropout": 0.1,
+  "hidden_dim": 3072,
+  "initializer_range": 0.02,
+  "max_position_embeddings": 512,
+  "model_type": "distilbert",
+  "n_heads": 12,
+  "n_layers": 6,
+  "pad_token_id": 0,
+  "problem_type": "single_label_classification",
+  "qa_dropout": 0.1,
+  "seq_classif_dropout": 0.2,
+  "sinusoidal_pos_embds": false,
+  "tie_weights_": true,
+  "torch_dtype": "float32",
+  "transformers_version": "4.38.1",
+  "vocab_size": 30522
+}

run-6/checkpoint-27/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:29af0fd1c86642810cfb5c9e0a1a5341cd29fd43201c1c76f8ffeb62ccb28960
+size 267832560

run-6/checkpoint-27/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:f7a27f192d3a71915bb299e5b2af84bad81e173aa435db67b8f8f7dcc38ea4f1
+size 535727290

run-6/checkpoint-27/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:be2e61cfb32bd0131c8524d0f66b7881e91890fc6d136be5e1c3e92c518e8271
+size 14180

run-6/checkpoint-27/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:78211af0617a93ef10e44f30f019475c4d114e491e90b3e31e0177e344910fbc
+size 1064

run-6/checkpoint-27/special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,7 @@

+{
+  "cls_token": "[CLS]",
+  "mask_token": "[MASK]",
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "unk_token": "[UNK]"
+}

run-6/checkpoint-27/tokenizer.json ADDED Viewed

The diff for this file is too large to render. See raw diff

run-6/checkpoint-27/tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,55 @@

+{
+  "added_tokens_decoder": {
+    "0": {
+      "content": "[PAD]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "100": {
+      "content": "[UNK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "101": {
+      "content": "[CLS]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "102": {
+      "content": "[SEP]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "103": {
+      "content": "[MASK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "clean_up_tokenization_spaces": true,
+  "cls_token": "[CLS]",
+  "do_lower_case": true,
+  "mask_token": "[MASK]",
+  "model_max_length": 512,
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "strip_accents": null,
+  "tokenize_chinese_chars": true,
+  "tokenizer_class": "DistilBertTokenizer",
+  "unk_token": "[UNK]"
+}

run-6/checkpoint-27/trainer_state.json ADDED Viewed

	@@ -0,0 +1,35 @@

+{
+  "best_metric": 0.0,
+  "best_model_checkpoint": "distilbert-base-uncased-finetuned-cola/run-6/checkpoint-27",
+  "epoch": 1.0,
+  "eval_steps": 500,
+  "global_step": 27,
+  "is_hyper_param_search": true,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 1.0,
+      "eval_loss": 0.6180562973022461,
+      "eval_matthews_correlation": 0.0,
+      "eval_runtime": 0.7927,
+      "eval_samples_per_second": 1315.68,
+      "eval_steps_per_second": 83.255,
+      "step": 27
+    }
+  ],
+  "logging_steps": 500,
+  "max_steps": 81,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 3,
+  "save_steps": 500,
+  "total_flos": 0,
+  "train_batch_size": 32,
+  "trial_name": null,
+  "trial_params": {
+    "learning_rate": 6.155006780291272e-06,
+    "num_train_epochs": 3,
+    "per_device_train_batch_size": 32,
+    "seed": 10
+  }
+}

run-6/checkpoint-27/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:576e8a633ebecf0dcad9ad36c9c1f24b8ae26286776e3e989c11ef48601b2eec
+size 4984

run-6/checkpoint-27/vocab.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

run-8/checkpoint-14/config.json ADDED Viewed

	@@ -0,0 +1,25 @@

+{
+  "_name_or_path": "distilbert-base-uncased",
+  "activation": "gelu",
+  "architectures": [
+    "DistilBertForSequenceClassification"
+  ],
+  "attention_dropout": 0.1,
+  "dim": 768,
+  "dropout": 0.1,
+  "hidden_dim": 3072,
+  "initializer_range": 0.02,
+  "max_position_embeddings": 512,
+  "model_type": "distilbert",
+  "n_heads": 12,
+  "n_layers": 6,
+  "pad_token_id": 0,
+  "problem_type": "single_label_classification",
+  "qa_dropout": 0.1,
+  "seq_classif_dropout": 0.2,
+  "sinusoidal_pos_embds": false,
+  "tie_weights_": true,
+  "torch_dtype": "float32",
+  "transformers_version": "4.38.1",
+  "vocab_size": 30522
+}

run-8/checkpoint-14/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:9825860c6ec9bec4da4064495e4de0fcac3ad1e960e49586ab5d51f5c671ad36
+size 267832560

run-8/checkpoint-14/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:e5577f9ec2e0420a5e7e51f3879ca5c0cfac55363a12d3f8a96b7f78f62261ba
+size 535727290

run-8/checkpoint-14/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:b3c12604b72013b6685abf7ae7aa8cb19a8e2c467b5844ba4019e5919b528729
+size 14244

run-8/checkpoint-14/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:b013582b777fd12efd3319f638f1b50db49ce12f41cced995000c40073b2cb8a
+size 1064

run-8/checkpoint-14/special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,7 @@

+{
+  "cls_token": "[CLS]",
+  "mask_token": "[MASK]",
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "unk_token": "[UNK]"
+}

run-8/checkpoint-14/tokenizer.json ADDED Viewed

The diff for this file is too large to render. See raw diff

run-8/checkpoint-14/tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,55 @@

+{
+  "added_tokens_decoder": {
+    "0": {
+      "content": "[PAD]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "100": {
+      "content": "[UNK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "101": {
+      "content": "[CLS]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "102": {
+      "content": "[SEP]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "103": {
+      "content": "[MASK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "clean_up_tokenization_spaces": true,
+  "cls_token": "[CLS]",
+  "do_lower_case": true,
+  "mask_token": "[MASK]",
+  "model_max_length": 512,
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "strip_accents": null,
+  "tokenize_chinese_chars": true,
+  "tokenizer_class": "DistilBertTokenizer",
+  "unk_token": "[UNK]"
+}

run-8/checkpoint-14/trainer_state.json ADDED Viewed

	@@ -0,0 +1,35 @@

+{
+  "best_metric": 0.0,
+  "best_model_checkpoint": "distilbert-base-uncased-finetuned-cola/run-8/checkpoint-14",
+  "epoch": 1.0,
+  "eval_steps": 500,
+  "global_step": 14,
+  "is_hyper_param_search": true,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 1.0,
+      "eval_loss": 0.6050807237625122,
+      "eval_matthews_correlation": 0.0,
+      "eval_runtime": 1.2093,
+      "eval_samples_per_second": 862.486,
+      "eval_steps_per_second": 54.577,
+      "step": 14
+    }
+  ],
+  "logging_steps": 500,
+  "max_steps": 28,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 2,
+  "save_steps": 500,
+  "total_flos": 0,
+  "train_batch_size": 64,
+  "trial_name": null,
+  "trial_params": {
+    "learning_rate": 5.6377293486135757e-05,
+    "num_train_epochs": 2,
+    "per_device_train_batch_size": 64,
+    "seed": 16
+  }
+}

run-8/checkpoint-14/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:9fad24c79917de56c27af5271c94818eabaf3f3872062c491ecc9c38c4cd3da4
+size 4984

run-8/checkpoint-14/vocab.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

run-8/checkpoint-28/config.json ADDED Viewed

	@@ -0,0 +1,25 @@

+{
+  "_name_or_path": "distilbert-base-uncased",
+  "activation": "gelu",
+  "architectures": [
+    "DistilBertForSequenceClassification"
+  ],
+  "attention_dropout": 0.1,
+  "dim": 768,
+  "dropout": 0.1,
+  "hidden_dim": 3072,
+  "initializer_range": 0.02,
+  "max_position_embeddings": 512,
+  "model_type": "distilbert",
+  "n_heads": 12,
+  "n_layers": 6,
+  "pad_token_id": 0,
+  "problem_type": "single_label_classification",
+  "qa_dropout": 0.1,
+  "seq_classif_dropout": 0.2,
+  "sinusoidal_pos_embds": false,
+  "tie_weights_": true,
+  "torch_dtype": "float32",
+  "transformers_version": "4.38.1",
+  "vocab_size": 30522
+}

run-8/checkpoint-28/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:cb77ac3c816e23fddc1989318b47ec6ac27447fb86d367027ab6c003b01c79ce
+size 267832560

run-8/checkpoint-28/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:bb956be810da1004a52381159b47a980a20bf9e4e257c5ac098d8cd160205b84
+size 535727290

run-8/checkpoint-28/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:9c7c3bf419e85329b27667f364dd600c1604458e4c503bca245c2fce723e6009
+size 14244

run-8/checkpoint-28/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:af790769780716b1ffac659b155707486f29ca642b81e62f8d292e634f7c600b
+size 1064

run-8/checkpoint-28/special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,7 @@

+{
+  "cls_token": "[CLS]",
+  "mask_token": "[MASK]",
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "unk_token": "[UNK]"
+}

run-8/checkpoint-28/tokenizer.json ADDED Viewed

The diff for this file is too large to render. See raw diff

run-8/checkpoint-28/tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,55 @@

+{
+  "added_tokens_decoder": {
+    "0": {
+      "content": "[PAD]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "100": {
+      "content": "[UNK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "101": {
+      "content": "[CLS]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "102": {
+      "content": "[SEP]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "103": {
+      "content": "[MASK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "clean_up_tokenization_spaces": true,
+  "cls_token": "[CLS]",
+  "do_lower_case": true,
+  "mask_token": "[MASK]",
+  "model_max_length": 512,
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "strip_accents": null,
+  "tokenize_chinese_chars": true,
+  "tokenizer_class": "DistilBertTokenizer",
+  "unk_token": "[UNK]"
+}

run-8/checkpoint-28/trainer_state.json ADDED Viewed

	@@ -0,0 +1,44 @@

+{
+  "best_metric": 0.0,
+  "best_model_checkpoint": "distilbert-base-uncased-finetuned-cola/run-8/checkpoint-14",
+  "epoch": 2.0,
+  "eval_steps": 500,
+  "global_step": 28,
+  "is_hyper_param_search": true,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 1.0,
+      "eval_loss": 0.6050807237625122,
+      "eval_matthews_correlation": 0.0,
+      "eval_runtime": 1.2093,
+      "eval_samples_per_second": 862.486,
+      "eval_steps_per_second": 54.577,
+      "step": 14
+    },
+    {
+      "epoch": 2.0,
+      "eval_loss": 0.5790172815322876,
+      "eval_matthews_correlation": 0.0,
+      "eval_runtime": 0.8146,
+      "eval_samples_per_second": 1280.342,
+      "eval_steps_per_second": 81.019,
+      "step": 28
+    }
+  ],
+  "logging_steps": 500,
+  "max_steps": 28,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 2,
+  "save_steps": 500,
+  "total_flos": 0,
+  "train_batch_size": 64,
+  "trial_name": null,
+  "trial_params": {
+    "learning_rate": 5.6377293486135757e-05,
+    "num_train_epochs": 2,
+    "per_device_train_batch_size": 64,
+    "seed": 16
+  }
+}

run-8/checkpoint-28/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:9fad24c79917de56c27af5271c94818eabaf3f3872062c491ecc9c38c4cd3da4
+size 4984

run-8/checkpoint-28/vocab.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

runs/Feb27_16-43-42_b3bc3fede2ea/events.out.tfevents.1709053090.b3bc3fede2ea.5958.8 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:6201e2b1bf2e7bd8ffc7efc36de34b7e4d40ee9436a622a871ff5a707f016137
+size 5200

runs/Feb27_16-43-42_b3bc3fede2ea/events.out.tfevents.1709053104.b3bc3fede2ea.5958.9 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:88eb749f333e459e4142a44d3a164ff49e3053422b6d3e1d73e55c29606fc0c1
+size 4872

runs/Feb27_16-43-42_b3bc3fede2ea/events.out.tfevents.1709053108.b3bc3fede2ea.5958.10 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:05ed7b23a5e4a07951a5464050961a62bd68f7a8e8251800a2b158c58dec250f
+size 5549

runs/Feb27_16-43-42_b3bc3fede2ea/events.out.tfevents.1709053201.b3bc3fede2ea.5958.11 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:7e4f6ba3daa8913944b9b11fa271703e9418929c802525bf542ffc18e4fdf632
+size 6205

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:12789646f1ace8590d718854a0dcb7cbdcd7655dfa3e3b9eea3031d650c025e3
+oid sha256:9109f7e7761b3976c7e539cd75f703d1342c83a109dd00b8d10d602cf1dddf4d
 size 4984