Shresthadev403 committed on
Commit
0730770
1 Parent(s): 1a902bf

End of training

Browse files
README.md CHANGED
@@ -17,13 +17,13 @@ should probably proofread and complete it, then remove this comment. -->
17
 
18
  This model is a fine-tuned version of [google/vit-base-patch16-224-in21k](https://huggingface.co/google/vit-base-patch16-224-in21k) on the food101 dataset.
19
  It achieves the following results on the evaluation set:
20
- - eval_loss: 4.5759
21
- - eval_accuracy: 0.0349
22
- - eval_runtime: 157.053
23
- - eval_samples_per_second: 96.464
24
- - eval_steps_per_second: 6.03
25
- - epoch: 1.06
26
- - step: 1000
27
 
28
  ## Model description
29
 
 
17
 
18
  This model is a fine-tuned version of [google/vit-base-patch16-224-in21k](https://huggingface.co/google/vit-base-patch16-224-in21k) on the food101 dataset.
19
  It achieves the following results on the evaluation set:
20
+ - eval_loss: 4.3789
21
+ - eval_accuracy: 0.3104
22
+ - eval_runtime: 154.3948
23
+ - eval_samples_per_second: 98.125
24
+ - eval_steps_per_second: 6.134
25
+ - epoch: 2.11
26
+ - step: 2000
27
 
28
  ## Model description
29
 
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4eabec32f0ba76003916089cd24abcbfceda6bc9f6dbc42c9f42b2fc063a8f2e
3
  size 343528508
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:eeb12dca342515db73c7bc5e69f8b9003ed35f85c1ce8b02d9dd43a388f4dd44
3
  size 343528508
runs/Feb05_03-08-58_983d148b451b/events.out.tfevents.1707102539.983d148b451b.26.0 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8637b62b758fd8d7af76bf6901bf4667283d0e4976458e3bb304993167e435a2
3
- size 9781
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:834296abb97fa742bf1375c1e8b811bdd982a60dda439d88177ff3ebb4dce784
3
+ size 10261
trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
- "best_metric": null,
3
- "best_model_checkpoint": null,
4
- "epoch": 1.0559662090813093,
5
  "eval_steps": 1000,
6
- "global_step": 1000,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -22,6 +22,21 @@
22
  "eval_samples_per_second": 96.464,
23
  "eval_steps_per_second": 6.03,
24
  "step": 1000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
25
  }
26
  ],
27
  "logging_steps": 1000,
@@ -29,7 +44,7 @@
29
  "num_input_tokens_seen": 0,
30
  "num_train_epochs": 500,
31
  "save_steps": 1000,
32
- "total_flos": 4.963267430656819e+18,
33
  "train_batch_size": 16,
34
  "trial_name": null,
35
  "trial_params": null
 
1
  {
2
+ "best_metric": 0.034851485148514855,
3
+ "best_model_checkpoint": "food-image-classification/checkpoint-1000",
4
+ "epoch": 2.1119324181626187,
5
  "eval_steps": 1000,
6
+ "global_step": 2000,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
22
  "eval_samples_per_second": 96.464,
23
  "eval_steps_per_second": 6.03,
24
  "step": 1000
25
+ },
26
+ {
27
+ "epoch": 2.11,
28
+ "learning_rate": 2.111932418162619e-06,
29
+ "loss": 4.4899,
30
+ "step": 2000
31
+ },
32
+ {
33
+ "epoch": 2.11,
34
+ "eval_accuracy": 0.3103630363036304,
35
+ "eval_loss": 4.3788862228393555,
36
+ "eval_runtime": 154.3948,
37
+ "eval_samples_per_second": 98.125,
38
+ "eval_steps_per_second": 6.134,
39
+ "step": 2000
40
  }
41
  ],
42
  "logging_steps": 1000,
 
44
  "num_input_tokens_seen": 0,
45
  "num_train_epochs": 500,
46
  "save_steps": 1000,
47
+ "total_flos": 9.926534861313638e+18,
48
  "train_batch_size": 16,
49
  "trial_name": null,
50
  "trial_params": null