EternalQuest committed on
Commit
e5e9967
1 Parent(s): 346dbd7

End of training

Browse files
README.md CHANGED
@@ -1,6 +1,6 @@
1
  ---
2
  license: apache-2.0
3
- base_model: distilbert-base-uncased
4
  tags:
5
  - generated_from_trainer
6
  metrics:
@@ -15,10 +15,10 @@ should probably proofread and complete it, then remove this comment. -->
15
 
16
  # my_awesome_model
17
 
18
- This model is a fine-tuned version of [distilbert-base-uncased](https://huggingface.co/distilbert-base-uncased) on an unknown dataset.
19
  It achieves the following results on the evaluation set:
20
- - Loss: 0.2363
21
- - Accuracy: 0.9309
22
 
23
  ## Model description
24
 
@@ -49,8 +49,8 @@ The following hyperparameters were used during training:
49
 
50
  | Training Loss | Epoch | Step | Validation Loss | Accuracy |
51
  |:-------------:|:-----:|:----:|:---------------:|:--------:|
52
- | 0.2245 | 1.0 | 1563 | 0.2030 | 0.9215 |
53
- | 0.1455 | 2.0 | 3126 | 0.2363 | 0.9309 |
54
 
55
 
56
  ### Framework versions
 
1
  ---
2
  license: apache-2.0
3
+ base_model: distilbert-base-uncased-finetuned-sst-2-english
4
  tags:
5
  - generated_from_trainer
6
  metrics:
 
15
 
16
  # my_awesome_model
17
 
18
+ This model is a fine-tuned version of [distilbert-base-uncased-finetuned-sst-2-english](https://huggingface.co/distilbert-base-uncased-finetuned-sst-2-english) on an unknown dataset.
19
  It achieves the following results on the evaluation set:
20
+ - Loss: 0.2367
21
+ - Accuracy: 0.9343
22
 
23
  ## Model description
24
 
 
49
 
50
  | Training Loss | Epoch | Step | Validation Loss | Accuracy |
51
  |:-------------:|:-----:|:----:|:---------------:|:--------:|
52
+ | 0.2089 | 1.0 | 1563 | 0.1805 | 0.9315 |
53
+ | 0.133 | 2.0 | 3126 | 0.2367 | 0.9343 |
54
 
55
 
56
  ### Framework versions
config.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "_name_or_path": "distilbert-base-uncased",
3
  "activation": "gelu",
4
  "architectures": [
5
  "DistilBertForSequenceClassification"
@@ -7,6 +7,7 @@
7
  "attention_dropout": 0.1,
8
  "dim": 768,
9
  "dropout": 0.1,
 
10
  "hidden_dim": 3072,
11
  "id2label": {
12
  "0": "NEGATIVE",
@@ -21,6 +22,7 @@
21
  "model_type": "distilbert",
22
  "n_heads": 12,
23
  "n_layers": 6,
 
24
  "pad_token_id": 0,
25
  "problem_type": "single_label_classification",
26
  "qa_dropout": 0.1,
 
1
  {
2
+ "_name_or_path": "distilbert-base-uncased-finetuned-sst-2-english",
3
  "activation": "gelu",
4
  "architectures": [
5
  "DistilBertForSequenceClassification"
 
7
  "attention_dropout": 0.1,
8
  "dim": 768,
9
  "dropout": 0.1,
10
+ "finetuning_task": "sst-2",
11
  "hidden_dim": 3072,
12
  "id2label": {
13
  "0": "NEGATIVE",
 
22
  "model_type": "distilbert",
23
  "n_heads": 12,
24
  "n_layers": 6,
25
+ "output_past": true,
26
  "pad_token_id": 0,
27
  "problem_type": "single_label_classification",
28
  "qa_dropout": 0.1,
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:da0eed05160a71ad0d1c2a3892f7258a4f8765b0fb10811b58e827a5901d94a4
3
  size 267832560
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ac71ac7ca38fd58f656f39293ecf3f8eb90a4224b3be56f0ff7a4956498368a3
3
  size 267832560
runs/Aug05_11-37-45_6dce5b3955ed/events.out.tfevents.1722857867.6dce5b3955ed.801.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:18e72be1523c82b192f9839eb92911f739398fd8b198e01c6ca6b87c646f4c05
3
+ size 7195
tokenizer.json CHANGED
@@ -1,6 +1,11 @@
1
  {
2
  "version": "1.0",
3
- "truncation": null,
 
 
 
 
 
4
  "padding": null,
5
  "added_tokens": [
6
  {
 
1
  {
2
  "version": "1.0",
3
+ "truncation": {
4
+ "direction": "Right",
5
+ "max_length": 512,
6
+ "strategy": "LongestFirst",
7
+ "stride": 0
8
+ },
9
  "padding": null,
10
  "added_tokens": [
11
  {
tokenizer_config.json CHANGED
@@ -43,9 +43,11 @@
43
  },
44
  "clean_up_tokenization_spaces": true,
45
  "cls_token": "[CLS]",
 
46
  "do_lower_case": true,
47
  "mask_token": "[MASK]",
48
  "model_max_length": 512,
 
49
  "pad_token": "[PAD]",
50
  "sep_token": "[SEP]",
51
  "strip_accents": null,
 
43
  },
44
  "clean_up_tokenization_spaces": true,
45
  "cls_token": "[CLS]",
46
+ "do_basic_tokenize": true,
47
  "do_lower_case": true,
48
  "mask_token": "[MASK]",
49
  "model_max_length": 512,
50
+ "never_split": null,
51
  "pad_token": "[PAD]",
52
  "sep_token": "[SEP]",
53
  "strip_accents": null,
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5f6197da3cb2e825692a1c4f0cb38f170424498fb93c82c1467b316ba63e167a
3
  size 5112
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:54641bf57555c343f01a033390c6ce34c3f34a66c85a2a276ff59958acc329b7
3
  size 5112