mrm8488 committed on
Commit
9059152
1 Parent(s): 5720b66

Initial commit from mrm8488

Browse files
This view is limited to 50 files because it contains too many changes. See raw diff
Files changed (50) hide show
  1. README.md +76 -0
  2. checkpoint-1020/config.json +39 -0
  3. checkpoint-1020/merges.txt +0 -0
  4. checkpoint-1020/optimizer.pt +3 -0
  5. checkpoint-1020/pytorch_model.bin +3 -0
  6. checkpoint-1020/rng_state.pth +3 -0
  7. checkpoint-1020/scheduler.pt +3 -0
  8. checkpoint-1020/special_tokens_map.json +1 -0
  9. checkpoint-1020/tokenizer.json +0 -0
  10. checkpoint-1020/tokenizer_config.json +1 -0
  11. checkpoint-1020/trainer_state.json +64 -0
  12. checkpoint-1020/training_args.bin +3 -0
  13. checkpoint-1020/vocab.json +0 -0
  14. checkpoint-1275/config.json +39 -0
  15. checkpoint-1275/merges.txt +0 -0
  16. checkpoint-1275/optimizer.pt +3 -0
  17. checkpoint-1275/pytorch_model.bin +3 -0
  18. checkpoint-1275/rng_state.pth +3 -0
  19. checkpoint-1275/scheduler.pt +3 -0
  20. checkpoint-1275/special_tokens_map.json +1 -0
  21. checkpoint-1275/tokenizer.json +0 -0
  22. checkpoint-1275/tokenizer_config.json +1 -0
  23. checkpoint-1275/trainer_state.json +73 -0
  24. checkpoint-1275/training_args.bin +3 -0
  25. checkpoint-1275/vocab.json +0 -0
  26. checkpoint-255/config.json +39 -0
  27. checkpoint-255/merges.txt +0 -0
  28. checkpoint-255/optimizer.pt +3 -0
  29. checkpoint-255/pytorch_model.bin +3 -0
  30. checkpoint-255/rng_state.pth +3 -0
  31. checkpoint-255/scheduler.pt +3 -0
  32. checkpoint-255/special_tokens_map.json +1 -0
  33. checkpoint-255/tokenizer.json +0 -0
  34. checkpoint-255/tokenizer_config.json +1 -0
  35. checkpoint-255/trainer_state.json +25 -0
  36. checkpoint-255/training_args.bin +3 -0
  37. checkpoint-255/vocab.json +0 -0
  38. checkpoint-510/config.json +39 -0
  39. checkpoint-510/merges.txt +0 -0
  40. checkpoint-510/optimizer.pt +3 -0
  41. checkpoint-510/pytorch_model.bin +3 -0
  42. checkpoint-510/rng_state.pth +3 -0
  43. checkpoint-510/scheduler.pt +3 -0
  44. checkpoint-510/special_tokens_map.json +1 -0
  45. checkpoint-510/tokenizer.json +0 -0
  46. checkpoint-510/tokenizer_config.json +1 -0
  47. checkpoint-510/trainer_state.json +40 -0
  48. checkpoint-510/training_args.bin +3 -0
  49. checkpoint-510/vocab.json +0 -0
  50. checkpoint-765/config.json +39 -0
README.md ADDED
@@ -0,0 +1,76 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ license: apache-2.0
3
+ tags:
4
+ - generated_from_trainer
5
+ datasets:
6
+ - financial_phrasebank
7
+ metrics:
8
+ - accuracy
9
+ model-index:
10
+ - name: distilRoberta-financial-sentiment
11
+ results:
12
+ - task:
13
+ name: Text Classification
14
+ type: text-classification
15
+ dataset:
16
+ name: financial_phrasebank
17
+ type: financial_phrasebank
18
+ args: sentences_allagree
19
+ metrics:
20
+ - name: Accuracy
21
+ type: accuracy
22
+ value: 0.9823008849557522
23
+ ---
24
+
25
+ <!-- This model card has been generated automatically according to the information the Trainer had access to. You
26
+ should probably proofread and complete it, then remove this comment. -->
27
+
28
+ # distilRoberta-financial-sentiment
29
+
30
+ This model is a fine-tuned version of [distilroberta-base](https://huggingface.co/distilroberta-base) on the financial_phrasebank dataset.
31
+ It achieves the following results on the evaluation set:
32
+ - Loss: 0.1116
33
+ - Accuracy: 0.9823
34
+
35
+ ## Model description
36
+
37
+ More information needed
38
+
39
+ ## Intended uses & limitations
40
+
41
+ More information needed
42
+
43
+ ## Training and evaluation data
44
+
45
+ More information needed
46
+
47
+ ## Training procedure
48
+
49
+ ### Training hyperparameters
50
+
51
+ The following hyperparameters were used during training:
52
+ - learning_rate: 2e-05
53
+ - train_batch_size: 8
54
+ - eval_batch_size: 8
55
+ - seed: 42
56
+ - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
57
+ - lr_scheduler_type: linear
58
+ - num_epochs: 5
59
+
60
+ ### Training results
61
+
62
+ | Training Loss | Epoch | Step | Validation Loss | Accuracy |
63
+ |:-------------:|:-----:|:----:|:---------------:|:--------:|
64
+ | No log | 1.0 | 255 | 0.1670 | 0.9646 |
65
+ | 0.209 | 2.0 | 510 | 0.2290 | 0.9558 |
66
+ | 0.209 | 3.0 | 765 | 0.2044 | 0.9558 |
67
+ | 0.0326 | 4.0 | 1020 | 0.1116 | 0.9823 |
68
+ | 0.0326 | 5.0 | 1275 | 0.1127 | 0.9779 |
69
+
70
+
71
+ ### Framework versions
72
+
73
+ - Transformers 4.10.2
74
+ - Pytorch 1.9.0+cu102
75
+ - Datasets 1.12.1
76
+ - Tokenizers 0.10.3
checkpoint-1020/config.json ADDED
@@ -0,0 +1,39 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "distilroberta-base",
3
+ "architectures": [
4
+ "RobertaForSequenceClassification"
5
+ ],
6
+ "attention_probs_dropout_prob": 0.1,
7
+ "bos_token_id": 0,
8
+ "classifier_dropout": null,
9
+ "eos_token_id": 2,
10
+ "gradient_checkpointing": false,
11
+ "hidden_act": "gelu",
12
+ "hidden_dropout_prob": 0.1,
13
+ "hidden_size": 768,
14
+ "id2label": {
15
+ "0": "LABEL_0",
16
+ "1": "LABEL_1",
17
+ "2": "LABEL_2"
18
+ },
19
+ "initializer_range": 0.02,
20
+ "intermediate_size": 3072,
21
+ "label2id": {
22
+ "LABEL_0": 0,
23
+ "LABEL_1": 1,
24
+ "LABEL_2": 2
25
+ },
26
+ "layer_norm_eps": 1e-05,
27
+ "max_position_embeddings": 514,
28
+ "model_type": "roberta",
29
+ "num_attention_heads": 12,
30
+ "num_hidden_layers": 6,
31
+ "pad_token_id": 1,
32
+ "position_embedding_type": "absolute",
33
+ "problem_type": "single_label_classification",
34
+ "torch_dtype": "float32",
35
+ "transformers_version": "4.10.2",
36
+ "type_vocab_size": 1,
37
+ "use_cache": true,
38
+ "vocab_size": 50265
39
+ }
checkpoint-1020/merges.txt ADDED
The diff for this file is too large to render. See raw diff
checkpoint-1020/optimizer.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3a10d139e099d856113f8f9bec12c657e6d97106685112c3f8f9090244f21ac6
3
+ size 657026205
checkpoint-1020/pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c6d24cd7c45f0b65241fd9ff1aa97814eea3ab7bdbf1458248fb9f4b2c817864
3
+ size 328529005
checkpoint-1020/rng_state.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:133c6f14a48205cfdb6ebb24164c59ba141f1b3bb6282c1a0f245e16e419918e
3
+ size 14503
checkpoint-1020/scheduler.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5b5fb5b60622a213ada574e87f31d8d1d9c80a4bff68598fca269c91968c006c
3
+ size 623
checkpoint-1020/special_tokens_map.json ADDED
@@ -0,0 +1 @@
 
1
+ {"bos_token": "<s>", "eos_token": "</s>", "unk_token": "<unk>", "sep_token": "</s>", "pad_token": "<pad>", "cls_token": "<s>", "mask_token": {"content": "<mask>", "single_word": false, "lstrip": true, "rstrip": false, "normalized": false}}
checkpoint-1020/tokenizer.json ADDED
The diff for this file is too large to render. See raw diff
checkpoint-1020/tokenizer_config.json ADDED
@@ -0,0 +1 @@
 
1
+ {"unk_token": "<unk>", "bos_token": "<s>", "eos_token": "</s>", "add_prefix_space": false, "errors": "replace", "sep_token": "</s>", "cls_token": "<s>", "pad_token": "<pad>", "mask_token": "<mask>", "model_max_length": 512, "special_tokens_map_file": null, "name_or_path": "distilroberta-base", "tokenizer_class": "RobertaTokenizer"}
checkpoint-1020/trainer_state.json ADDED
@@ -0,0 +1,64 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_metric": 0.9823008849557522,
3
+ "best_model_checkpoint": "/content/drive/MyDrive/distilRoberta-financial-sentiment/checkpoint-1020",
4
+ "epoch": 4.0,
5
+ "global_step": 1020,
6
+ "is_hyper_param_search": false,
7
+ "is_local_process_zero": true,
8
+ "is_world_process_zero": true,
9
+ "log_history": [
10
+ {
11
+ "epoch": 1.0,
12
+ "eval_accuracy": 0.9646017699115044,
13
+ "eval_loss": 0.16703279316425323,
14
+ "eval_runtime": 0.4253,
15
+ "eval_samples_per_second": 531.427,
16
+ "eval_steps_per_second": 68.192,
17
+ "step": 255
18
+ },
19
+ {
20
+ "epoch": 1.96,
21
+ "learning_rate": 1.215686274509804e-05,
22
+ "loss": 0.209,
23
+ "step": 500
24
+ },
25
+ {
26
+ "epoch": 2.0,
27
+ "eval_accuracy": 0.9557522123893806,
28
+ "eval_loss": 0.22898824512958527,
29
+ "eval_runtime": 0.4057,
30
+ "eval_samples_per_second": 557.077,
31
+ "eval_steps_per_second": 71.483,
32
+ "step": 510
33
+ },
34
+ {
35
+ "epoch": 3.0,
36
+ "eval_accuracy": 0.9557522123893806,
37
+ "eval_loss": 0.20438142120838165,
38
+ "eval_runtime": 0.4213,
39
+ "eval_samples_per_second": 536.442,
40
+ "eval_steps_per_second": 68.835,
41
+ "step": 765
42
+ },
43
+ {
44
+ "epoch": 3.92,
45
+ "learning_rate": 4.313725490196079e-06,
46
+ "loss": 0.0326,
47
+ "step": 1000
48
+ },
49
+ {
50
+ "epoch": 4.0,
51
+ "eval_accuracy": 0.9823008849557522,
52
+ "eval_loss": 0.11158797889947891,
53
+ "eval_runtime": 0.4245,
54
+ "eval_samples_per_second": 532.332,
55
+ "eval_steps_per_second": 68.308,
56
+ "step": 1020
57
+ }
58
+ ],
59
+ "max_steps": 1275,
60
+ "num_train_epochs": 5,
61
+ "total_flos": 109104889463388.0,
62
+ "trial_name": null,
63
+ "trial_params": null
64
+ }
checkpoint-1020/training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ee1178219233a39de3467c1d1c9ad2fd1d976e51b9ed6bb5a459131607445eaf
3
+ size 2735
checkpoint-1020/vocab.json ADDED
The diff for this file is too large to render. See raw diff
checkpoint-1275/config.json ADDED
@@ -0,0 +1,39 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "distilroberta-base",
3
+ "architectures": [
4
+ "RobertaForSequenceClassification"
5
+ ],
6
+ "attention_probs_dropout_prob": 0.1,
7
+ "bos_token_id": 0,
8
+ "classifier_dropout": null,
9
+ "eos_token_id": 2,
10
+ "gradient_checkpointing": false,
11
+ "hidden_act": "gelu",
12
+ "hidden_dropout_prob": 0.1,
13
+ "hidden_size": 768,
14
+ "id2label": {
15
+ "0": "LABEL_0",
16
+ "1": "LABEL_1",
17
+ "2": "LABEL_2"
18
+ },
19
+ "initializer_range": 0.02,
20
+ "intermediate_size": 3072,
21
+ "label2id": {
22
+ "LABEL_0": 0,
23
+ "LABEL_1": 1,
24
+ "LABEL_2": 2
25
+ },
26
+ "layer_norm_eps": 1e-05,
27
+ "max_position_embeddings": 514,
28
+ "model_type": "roberta",
29
+ "num_attention_heads": 12,
30
+ "num_hidden_layers": 6,
31
+ "pad_token_id": 1,
32
+ "position_embedding_type": "absolute",
33
+ "problem_type": "single_label_classification",
34
+ "torch_dtype": "float32",
35
+ "transformers_version": "4.10.2",
36
+ "type_vocab_size": 1,
37
+ "use_cache": true,
38
+ "vocab_size": 50265
39
+ }
checkpoint-1275/merges.txt ADDED
The diff for this file is too large to render. See raw diff
checkpoint-1275/optimizer.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:75fcbedc38d2c17d18ac54e29a3a67ef140ebce4c29e1c97100eb85ffa994859
3
+ size 657026205
checkpoint-1275/pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f8c9cd771ae142b084f337b48bc6d3ef08344519e7e8b800d65d7581ffd1f6dc
3
+ size 328529005
checkpoint-1275/rng_state.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:60e92978b58e882b21cd2cb09760e0deb38b0133cae445d92efa6a28baa781a7
3
+ size 14503
checkpoint-1275/scheduler.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c0b3ce3a7534d3726f9e692752affc1b48524ec0f784701f84651de3aca1e0f0
3
+ size 623
checkpoint-1275/special_tokens_map.json ADDED
@@ -0,0 +1 @@
 
1
+ {"bos_token": "<s>", "eos_token": "</s>", "unk_token": "<unk>", "sep_token": "</s>", "pad_token": "<pad>", "cls_token": "<s>", "mask_token": {"content": "<mask>", "single_word": false, "lstrip": true, "rstrip": false, "normalized": false}}
checkpoint-1275/tokenizer.json ADDED
The diff for this file is too large to render. See raw diff
checkpoint-1275/tokenizer_config.json ADDED
@@ -0,0 +1 @@
 
1
+ {"unk_token": "<unk>", "bos_token": "<s>", "eos_token": "</s>", "add_prefix_space": false, "errors": "replace", "sep_token": "</s>", "cls_token": "<s>", "pad_token": "<pad>", "mask_token": "<mask>", "model_max_length": 512, "special_tokens_map_file": null, "name_or_path": "distilroberta-base", "tokenizer_class": "RobertaTokenizer"}
checkpoint-1275/trainer_state.json ADDED
@@ -0,0 +1,73 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_metric": 0.9823008849557522,
3
+ "best_model_checkpoint": "/content/drive/MyDrive/distilRoberta-financial-sentiment/checkpoint-1020",
4
+ "epoch": 5.0,
5
+ "global_step": 1275,
6
+ "is_hyper_param_search": false,
7
+ "is_local_process_zero": true,
8
+ "is_world_process_zero": true,
9
+ "log_history": [
10
+ {
11
+ "epoch": 1.0,
12
+ "eval_accuracy": 0.9646017699115044,
13
+ "eval_loss": 0.16703279316425323,
14
+ "eval_runtime": 0.4253,
15
+ "eval_samples_per_second": 531.427,
16
+ "eval_steps_per_second": 68.192,
17
+ "step": 255
18
+ },
19
+ {
20
+ "epoch": 1.96,
21
+ "learning_rate": 1.215686274509804e-05,
22
+ "loss": 0.209,
23
+ "step": 500
24
+ },
25
+ {
26
+ "epoch": 2.0,
27
+ "eval_accuracy": 0.9557522123893806,
28
+ "eval_loss": 0.22898824512958527,
29
+ "eval_runtime": 0.4057,
30
+ "eval_samples_per_second": 557.077,
31
+ "eval_steps_per_second": 71.483,
32
+ "step": 510
33
+ },
34
+ {
35
+ "epoch": 3.0,
36
+ "eval_accuracy": 0.9557522123893806,
37
+ "eval_loss": 0.20438142120838165,
38
+ "eval_runtime": 0.4213,
39
+ "eval_samples_per_second": 536.442,
40
+ "eval_steps_per_second": 68.835,
41
+ "step": 765
42
+ },
43
+ {
44
+ "epoch": 3.92,
45
+ "learning_rate": 4.313725490196079e-06,
46
+ "loss": 0.0326,
47
+ "step": 1000
48
+ },
49
+ {
50
+ "epoch": 4.0,
51
+ "eval_accuracy": 0.9823008849557522,
52
+ "eval_loss": 0.11158797889947891,
53
+ "eval_runtime": 0.4245,
54
+ "eval_samples_per_second": 532.332,
55
+ "eval_steps_per_second": 68.308,
56
+ "step": 1020
57
+ },
58
+ {
59
+ "epoch": 5.0,
60
+ "eval_accuracy": 0.9778761061946902,
61
+ "eval_loss": 0.11265852302312851,
62
+ "eval_runtime": 0.431,
63
+ "eval_samples_per_second": 524.402,
64
+ "eval_steps_per_second": 67.291,
65
+ "step": 1275
66
+ }
67
+ ],
68
+ "max_steps": 1275,
69
+ "num_train_epochs": 5,
70
+ "total_flos": 136563387115644.0,
71
+ "trial_name": null,
72
+ "trial_params": null
73
+ }
checkpoint-1275/training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ee1178219233a39de3467c1d1c9ad2fd1d976e51b9ed6bb5a459131607445eaf
3
+ size 2735
checkpoint-1275/vocab.json ADDED
The diff for this file is too large to render. See raw diff
checkpoint-255/config.json ADDED
@@ -0,0 +1,39 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "distilroberta-base",
3
+ "architectures": [
4
+ "RobertaForSequenceClassification"
5
+ ],
6
+ "attention_probs_dropout_prob": 0.1,
7
+ "bos_token_id": 0,
8
+ "classifier_dropout": null,
9
+ "eos_token_id": 2,
10
+ "gradient_checkpointing": false,
11
+ "hidden_act": "gelu",
12
+ "hidden_dropout_prob": 0.1,
13
+ "hidden_size": 768,
14
+ "id2label": {
15
+ "0": "LABEL_0",
16
+ "1": "LABEL_1",
17
+ "2": "LABEL_2"
18
+ },
19
+ "initializer_range": 0.02,
20
+ "intermediate_size": 3072,
21
+ "label2id": {
22
+ "LABEL_0": 0,
23
+ "LABEL_1": 1,
24
+ "LABEL_2": 2
25
+ },
26
+ "layer_norm_eps": 1e-05,
27
+ "max_position_embeddings": 514,
28
+ "model_type": "roberta",
29
+ "num_attention_heads": 12,
30
+ "num_hidden_layers": 6,
31
+ "pad_token_id": 1,
32
+ "position_embedding_type": "absolute",
33
+ "problem_type": "single_label_classification",
34
+ "torch_dtype": "float32",
35
+ "transformers_version": "4.10.2",
36
+ "type_vocab_size": 1,
37
+ "use_cache": true,
38
+ "vocab_size": 50265
39
+ }
checkpoint-255/merges.txt ADDED
The diff for this file is too large to render. See raw diff
checkpoint-255/optimizer.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:975b1ebc8d6a6c90134f55202316d19b3e80107d206c614021d293fd65c24106
3
+ size 657026077
checkpoint-255/pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b4b733235868bb0ec23026fbf9503e44701a09e253c725f4e3c48d9010d9119b
3
+ size 328529005
checkpoint-255/rng_state.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8a3a992b385bfed8a7947f3349b47e31d3a41012ea7e604ba8930022525ee395
3
+ size 14503
checkpoint-255/scheduler.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bf9b70b1312ed602ec4c2ce9c481f61d1ea9d352599c28f99624d803ef1abbb2
3
+ size 623
checkpoint-255/special_tokens_map.json ADDED
@@ -0,0 +1 @@
 
1
+ {"bos_token": "<s>", "eos_token": "</s>", "unk_token": "<unk>", "sep_token": "</s>", "pad_token": "<pad>", "cls_token": "<s>", "mask_token": {"content": "<mask>", "single_word": false, "lstrip": true, "rstrip": false, "normalized": false}}
checkpoint-255/tokenizer.json ADDED
The diff for this file is too large to render. See raw diff
checkpoint-255/tokenizer_config.json ADDED
@@ -0,0 +1 @@
 
1
+ {"unk_token": "<unk>", "bos_token": "<s>", "eos_token": "</s>", "add_prefix_space": false, "errors": "replace", "sep_token": "</s>", "cls_token": "<s>", "pad_token": "<pad>", "mask_token": "<mask>", "model_max_length": 512, "special_tokens_map_file": null, "name_or_path": "distilroberta-base", "tokenizer_class": "RobertaTokenizer"}
checkpoint-255/trainer_state.json ADDED
@@ -0,0 +1,25 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_metric": 0.9646017699115044,
3
+ "best_model_checkpoint": "/content/drive/MyDrive/distilRoberta-financial-sentiment/checkpoint-255",
4
+ "epoch": 1.0,
5
+ "global_step": 255,
6
+ "is_hyper_param_search": false,
7
+ "is_local_process_zero": true,
8
+ "is_world_process_zero": true,
9
+ "log_history": [
10
+ {
11
+ "epoch": 1.0,
12
+ "eval_accuracy": 0.9646017699115044,
13
+ "eval_loss": 0.16703279316425323,
14
+ "eval_runtime": 0.4253,
15
+ "eval_samples_per_second": 531.427,
16
+ "eval_steps_per_second": 68.192,
17
+ "step": 255
18
+ }
19
+ ],
20
+ "max_steps": 1275,
21
+ "num_train_epochs": 5,
22
+ "total_flos": 27420205611960.0,
23
+ "trial_name": null,
24
+ "trial_params": null
25
+ }
checkpoint-255/training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ee1178219233a39de3467c1d1c9ad2fd1d976e51b9ed6bb5a459131607445eaf
3
+ size 2735
checkpoint-255/vocab.json ADDED
The diff for this file is too large to render. See raw diff
checkpoint-510/config.json ADDED
@@ -0,0 +1,39 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "distilroberta-base",
3
+ "architectures": [
4
+ "RobertaForSequenceClassification"
5
+ ],
6
+ "attention_probs_dropout_prob": 0.1,
7
+ "bos_token_id": 0,
8
+ "classifier_dropout": null,
9
+ "eos_token_id": 2,
10
+ "gradient_checkpointing": false,
11
+ "hidden_act": "gelu",
12
+ "hidden_dropout_prob": 0.1,
13
+ "hidden_size": 768,
14
+ "id2label": {
15
+ "0": "LABEL_0",
16
+ "1": "LABEL_1",
17
+ "2": "LABEL_2"
18
+ },
19
+ "initializer_range": 0.02,
20
+ "intermediate_size": 3072,
21
+ "label2id": {
22
+ "LABEL_0": 0,
23
+ "LABEL_1": 1,
24
+ "LABEL_2": 2
25
+ },
26
+ "layer_norm_eps": 1e-05,
27
+ "max_position_embeddings": 514,
28
+ "model_type": "roberta",
29
+ "num_attention_heads": 12,
30
+ "num_hidden_layers": 6,
31
+ "pad_token_id": 1,
32
+ "position_embedding_type": "absolute",
33
+ "problem_type": "single_label_classification",
34
+ "torch_dtype": "float32",
35
+ "transformers_version": "4.10.2",
36
+ "type_vocab_size": 1,
37
+ "use_cache": true,
38
+ "vocab_size": 50265
39
+ }
checkpoint-510/merges.txt ADDED
The diff for this file is too large to render. See raw diff
checkpoint-510/optimizer.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8d8bcdb6b232b75268539ac908094b87c2485cf9f72e43a602596e731db2ac2a
3
+ size 657026205
checkpoint-510/pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6d037b8e1adbc44aa7ac023e87cbc070f9e38fbff4760759f77d7908d06af361
3
+ size 328529005
checkpoint-510/rng_state.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:48a061e86b42b51652875e3d2f31f7c4fa9b52250106d33553f74eb06c82ac04
3
+ size 14503
checkpoint-510/scheduler.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fcc0a142708d96432e37e864dacf92fbffed7431324f0234396de039f88c9435
3
+ size 623
checkpoint-510/special_tokens_map.json ADDED
@@ -0,0 +1 @@
 
1
+ {"bos_token": "<s>", "eos_token": "</s>", "unk_token": "<unk>", "sep_token": "</s>", "pad_token": "<pad>", "cls_token": "<s>", "mask_token": {"content": "<mask>", "single_word": false, "lstrip": true, "rstrip": false, "normalized": false}}
checkpoint-510/tokenizer.json ADDED
The diff for this file is too large to render. See raw diff
checkpoint-510/tokenizer_config.json ADDED
@@ -0,0 +1 @@
 
1
+ {"unk_token": "<unk>", "bos_token": "<s>", "eos_token": "</s>", "add_prefix_space": false, "errors": "replace", "sep_token": "</s>", "cls_token": "<s>", "pad_token": "<pad>", "mask_token": "<mask>", "model_max_length": 512, "special_tokens_map_file": null, "name_or_path": "distilroberta-base", "tokenizer_class": "RobertaTokenizer"}
checkpoint-510/trainer_state.json ADDED
@@ -0,0 +1,40 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_metric": 0.9646017699115044,
3
+ "best_model_checkpoint": "/content/drive/MyDrive/distilRoberta-financial-sentiment/checkpoint-255",
4
+ "epoch": 2.0,
5
+ "global_step": 510,
6
+ "is_hyper_param_search": false,
7
+ "is_local_process_zero": true,
8
+ "is_world_process_zero": true,
9
+ "log_history": [
10
+ {
11
+ "epoch": 1.0,
12
+ "eval_accuracy": 0.9646017699115044,
13
+ "eval_loss": 0.16703279316425323,
14
+ "eval_runtime": 0.4253,
15
+ "eval_samples_per_second": 531.427,
16
+ "eval_steps_per_second": 68.192,
17
+ "step": 255
18
+ },
19
+ {
20
+ "epoch": 1.96,
21
+ "learning_rate": 1.215686274509804e-05,
22
+ "loss": 0.209,
23
+ "step": 500
24
+ },
25
+ {
26
+ "epoch": 2.0,
27
+ "eval_accuracy": 0.9557522123893806,
28
+ "eval_loss": 0.22898824512958527,
29
+ "eval_runtime": 0.4057,
30
+ "eval_samples_per_second": 557.077,
31
+ "eval_steps_per_second": 71.483,
32
+ "step": 510
33
+ }
34
+ ],
35
+ "max_steps": 1275,
36
+ "num_train_epochs": 5,
37
+ "total_flos": 54781938243468.0,
38
+ "trial_name": null,
39
+ "trial_params": null
40
+ }
checkpoint-510/training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ee1178219233a39de3467c1d1c9ad2fd1d976e51b9ed6bb5a459131607445eaf
3
+ size 2735
checkpoint-510/vocab.json ADDED
The diff for this file is too large to render. See raw diff
checkpoint-765/config.json ADDED
@@ -0,0 +1,39 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "distilroberta-base",
3
+ "architectures": [
4
+ "RobertaForSequenceClassification"
5
+ ],
6
+ "attention_probs_dropout_prob": 0.1,
7
+ "bos_token_id": 0,
8
+ "classifier_dropout": null,
9
+ "eos_token_id": 2,
10
+ "gradient_checkpointing": false,
11
+ "hidden_act": "gelu",
12
+ "hidden_dropout_prob": 0.1,
13
+ "hidden_size": 768,
14
+ "id2label": {
15
+ "0": "LABEL_0",
16
+ "1": "LABEL_1",
17
+ "2": "LABEL_2"
18
+ },
19
+ "initializer_range": 0.02,
20
+ "intermediate_size": 3072,
21
+ "label2id": {
22
+ "LABEL_0": 0,
23
+ "LABEL_1": 1,
24
+ "LABEL_2": 2
25
+ },
26
+ "layer_norm_eps": 1e-05,
27
+ "max_position_embeddings": 514,
28
+ "model_type": "roberta",
29
+ "num_attention_heads": 12,
30
+ "num_hidden_layers": 6,
31
+ "pad_token_id": 1,
32
+ "position_embedding_type": "absolute",
33
+ "problem_type": "single_label_classification",
34
+ "torch_dtype": "float32",
35
+ "transformers_version": "4.10.2",
36
+ "type_vocab_size": 1,
37
+ "use_cache": true,
38
+ "vocab_size": 50265
39
+ }