pkr7098 committed on
Commit
d07588c
1 Parent(s): c1af32c

End of training

Browse files
Files changed (5) hide show
  1. README.md +3 -1
  2. all_results.json +10 -10
  3. eval_results.json +5 -5
  4. train_results.json +5 -5
  5. trainer_state.json +0 -0
README.md CHANGED
@@ -5,6 +5,8 @@ license: apache-2.0
5
  metrics:
6
  - accuracy
7
  tags:
 
 
8
  - generated_from_trainer
9
  model-index:
10
  - name: vit-cifar100-cifar100
@@ -16,7 +18,7 @@ should probably proofread and complete it, then remove this comment. -->
16
 
17
  # vit-cifar100-cifar100
18
 
19
- This model is a fine-tuned version of [google/vit-base-patch16-224-in21k](https://huggingface.co/google/vit-base-patch16-224-in21k) on an unknown dataset.
20
  It achieves the following results on the evaluation set:
21
  - Loss: 0.2550
22
  - Accuracy: 0.9236
 
5
  metrics:
6
  - accuracy
7
  tags:
8
+ - image-classification
9
+ - vision
10
  - generated_from_trainer
11
  model-index:
12
  - name: vit-cifar100-cifar100
 
18
 
19
  # vit-cifar100-cifar100
20
 
21
+ This model is a fine-tuned version of [google/vit-base-patch16-224-in21k](https://huggingface.co/google/vit-base-patch16-224-in21k) on the cifar100 dataset.
22
  It achieves the following results on the evaluation set:
23
  - Loss: 0.2550
24
  - Accuracy: 0.9236
all_results.json CHANGED
@@ -1,13 +1,13 @@
1
  {
2
  "epoch": 5.0,
3
- "eval_accuracy": 0.9252,
4
- "eval_loss": 0.2850923240184784,
5
- "eval_runtime": 284.1065,
6
- "eval_samples_per_second": 26.399,
7
- "eval_steps_per_second": 3.302,
8
- "total_flos": 1.64815115092992e+19,
9
- "train_loss": 1.0248974845253678,
10
- "train_runtime": 12727.7584,
11
- "train_samples_per_second": 16.696,
12
- "train_steps_per_second": 2.087
13
  }
 
1
  {
2
  "epoch": 5.0,
3
+ "eval_accuracy": 0.9236,
4
+ "eval_loss": 0.2550007104873657,
5
+ "eval_runtime": 61.8129,
6
+ "eval_samples_per_second": 121.334,
7
+ "eval_steps_per_second": 15.175,
8
+ "total_flos": 1.66660717676544e+19,
9
+ "train_loss": 0.7802943237124471,
10
+ "train_runtime": 11340.9032,
11
+ "train_samples_per_second": 18.737,
12
+ "train_steps_per_second": 2.342
13
  }
eval_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "epoch": 5.0,
3
- "eval_accuracy": 0.9252,
4
- "eval_loss": 0.2850923240184784,
5
- "eval_runtime": 284.1065,
6
- "eval_samples_per_second": 26.399,
7
- "eval_steps_per_second": 3.302
8
  }
 
1
  {
2
  "epoch": 5.0,
3
+ "eval_accuracy": 0.9236,
4
+ "eval_loss": 0.2550007104873657,
5
+ "eval_runtime": 61.8129,
6
+ "eval_samples_per_second": 121.334,
7
+ "eval_steps_per_second": 15.175
8
  }
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "epoch": 5.0,
3
- "total_flos": 1.64815115092992e+19,
4
- "train_loss": 1.0248974845253678,
5
- "train_runtime": 12727.7584,
6
- "train_samples_per_second": 16.696,
7
- "train_steps_per_second": 2.087
8
  }
 
1
  {
2
  "epoch": 5.0,
3
+ "total_flos": 1.66660717676544e+19,
4
+ "train_loss": 0.7802943237124471,
5
+ "train_runtime": 11340.9032,
6
+ "train_samples_per_second": 18.737,
7
+ "train_steps_per_second": 2.342
8
  }
trainer_state.json CHANGED
The diff for this file is too large to render. See raw diff