Bul11k committed on
Commit
c3b473a
1 Parent(s): 93fb266

End of training

Browse files
README.md CHANGED
@@ -3,6 +3,8 @@ license: mit
3
  base_model: cointegrated/rubert-tiny
4
  tags:
5
  - generated_from_trainer
 
 
6
  model-index:
7
  - name: finetuned-tiny-bert
8
  results: []
@@ -14,6 +16,9 @@ should probably proofread and complete it, then remove this comment. -->
14
  # finetuned-tiny-bert
15
 
16
  This model is a fine-tuned version of [cointegrated/rubert-tiny](https://huggingface.co/cointegrated/rubert-tiny) on an unknown dataset.
 
 
 
17
 
18
  ## Model description
19
 
 
3
  base_model: cointegrated/rubert-tiny
4
  tags:
5
  - generated_from_trainer
6
+ metrics:
7
+ - accuracy
8
  model-index:
9
  - name: finetuned-tiny-bert
10
  results: []
 
16
  # finetuned-tiny-bert
17
 
18
  This model is a fine-tuned version of [cointegrated/rubert-tiny](https://huggingface.co/cointegrated/rubert-tiny) on an unknown dataset.
19
+ It achieves the following results on the evaluation set:
20
+ - Loss: 2.5832
21
+ - Accuracy: 0.5167
22
 
23
  ## Model description
24
 
all_results.json CHANGED
@@ -2,14 +2,14 @@
2
  "epoch": 1.0,
3
  "eval_accuracy": 0.5167136043030395,
4
  "eval_loss": 2.5832159519195557,
5
- "eval_runtime": 62.4515,
6
  "eval_samples": 15263,
7
- "eval_samples_per_second": 244.398,
8
- "eval_steps_per_second": 7.638,
9
  "perplexity": 13.23964783936109,
10
  "train_loss": 3.04393067064311,
11
- "train_runtime": 385.498,
12
  "train_samples": 35613,
13
- "train_samples_per_second": 92.382,
14
- "train_steps_per_second": 2.887
15
  }
 
2
  "epoch": 1.0,
3
  "eval_accuracy": 0.5167136043030395,
4
  "eval_loss": 2.5832159519195557,
5
+ "eval_runtime": 62.4114,
6
  "eval_samples": 15263,
7
+ "eval_samples_per_second": 244.555,
8
+ "eval_steps_per_second": 7.643,
9
  "perplexity": 13.23964783936109,
10
  "train_loss": 3.04393067064311,
11
+ "train_runtime": 388.0084,
12
  "train_samples": 35613,
13
+ "train_samples_per_second": 91.784,
14
+ "train_steps_per_second": 2.868
15
  }
eval_results.json CHANGED
@@ -2,9 +2,9 @@
2
  "epoch": 1.0,
3
  "eval_accuracy": 0.5167136043030395,
4
  "eval_loss": 2.5832159519195557,
5
- "eval_runtime": 62.4515,
6
  "eval_samples": 15263,
7
- "eval_samples_per_second": 244.398,
8
- "eval_steps_per_second": 7.638,
9
  "perplexity": 13.23964783936109
10
  }
 
2
  "epoch": 1.0,
3
  "eval_accuracy": 0.5167136043030395,
4
  "eval_loss": 2.5832159519195557,
5
+ "eval_runtime": 62.4114,
6
  "eval_samples": 15263,
7
+ "eval_samples_per_second": 244.555,
8
+ "eval_steps_per_second": 7.643,
9
  "perplexity": 13.23964783936109
10
  }
runs/Feb25_10-54-45_e77a61bc3de0/events.out.tfevents.1708858943.e77a61bc3de0.13217.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8cd2482654241dd4697dcc72aaa9f2a7ef1b8ac0b48ec107fd59376a7ed0f6c5
3
+ size 411
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "epoch": 1.0,
3
  "train_loss": 3.04393067064311,
4
- "train_runtime": 385.498,
5
  "train_samples": 35613,
6
- "train_samples_per_second": 92.382,
7
- "train_steps_per_second": 2.887
8
  }
 
1
  {
2
  "epoch": 1.0,
3
  "train_loss": 3.04393067064311,
4
+ "train_runtime": 388.0084,
5
  "train_samples": 35613,
6
+ "train_samples_per_second": 91.784,
7
+ "train_steps_per_second": 2.868
8
  }
trainer_state.json CHANGED
@@ -27,9 +27,9 @@
27
  "step": 1113,
28
  "total_flos": 159583189651080.0,
29
  "train_loss": 3.04393067064311,
30
- "train_runtime": 385.498,
31
- "train_samples_per_second": 92.382,
32
- "train_steps_per_second": 2.887
33
  }
34
  ],
35
  "logging_steps": 500,
 
27
  "step": 1113,
28
  "total_flos": 159583189651080.0,
29
  "train_loss": 3.04393067064311,
30
+ "train_runtime": 388.0084,
31
+ "train_samples_per_second": 91.784,
32
+ "train_steps_per_second": 2.868
33
  }
34
  ],
35
  "logging_steps": 500,