Shresthadev403 committed on
Commit
8ea10e9
1 Parent(s): a7c2449

End of training

Browse files
README.md CHANGED
@@ -17,13 +17,13 @@ should probably proofread and complete it, then remove this comment. -->
17
 
18
  This model is a fine-tuned version of [google/vit-base-patch16-224-in21k](https://huggingface.co/google/vit-base-patch16-224-in21k) on the food101 dataset.
19
  It achieves the following results on the evaluation set:
20
- - eval_loss: 0.7518
21
- - eval_accuracy: 0.8152
22
- - eval_runtime: 153.2443
23
- - eval_samples_per_second: 98.862
24
- - eval_steps_per_second: 6.18
25
- - epoch: 19.01
26
- - step: 18000
27
 
28
  ## Model description
29
 
 
17
 
18
  This model is a fine-tuned version of [google/vit-base-patch16-224-in21k](https://huggingface.co/google/vit-base-patch16-224-in21k) on the food101 dataset.
19
  It achieves the following results on the evaluation set:
20
+ - eval_loss: 0.7491
21
+ - eval_accuracy: 0.8158
22
+ - eval_runtime: 155.8688
23
+ - eval_samples_per_second: 97.197
24
+ - eval_steps_per_second: 6.076
25
+ - epoch: 20.06
26
+ - step: 19000
27
 
28
  ## Model description
29
 
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:25eb29a43d1c3706c53a685065c6e3c7c500f7243e2151d946001a94203235e2
3
  size 343528508
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c9ac3ed48fc0d059f0736adfc532f21593147294028cb213e5c701923590d131
3
  size 343528508
runs/Feb05_03-08-58_983d148b451b/events.out.tfevents.1707102539.983d148b451b.26.0 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fc9304e21c3c2f1e31882a2e82185835820969fdeb90c4999dc1436d1cf932b8
3
- size 17959
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d36c2d904aa5c076536490d5fd2055eb4be73336d3bb8f672fb68682e3aadaf1
3
+ size 18448
trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": 0.8158415841584158,
3
  "best_model_checkpoint": "food-image-classification/checkpoint-16000",
4
- "epoch": 19.00739176346357,
5
  "eval_steps": 1000,
6
- "global_step": 18000,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -277,6 +277,21 @@
277
  "eval_samples_per_second": 98.862,
278
  "eval_steps_per_second": 6.18,
279
  "step": 18000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
280
  }
281
  ],
282
  "logging_steps": 1000,
@@ -284,7 +299,7 @@
284
  "num_input_tokens_seen": 0,
285
  "num_train_epochs": 500,
286
  "save_steps": 1000,
287
- "total_flos": 8.933819326583316e+19,
288
  "train_batch_size": 16,
289
  "trial_name": null,
290
  "trial_params": null
 
1
  {
2
  "best_metric": 0.8158415841584158,
3
  "best_model_checkpoint": "food-image-classification/checkpoint-16000",
4
+ "epoch": 20.06335797254488,
5
  "eval_steps": 1000,
6
+ "global_step": 19000,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
277
  "eval_samples_per_second": 98.862,
278
  "eval_steps_per_second": 6.18,
279
  "step": 18000
280
+ },
281
+ {
282
+ "epoch": 20.06,
283
+ "learning_rate": 2.006335797254488e-05,
284
+ "loss": 0.4656,
285
+ "step": 19000
286
+ },
287
+ {
288
+ "epoch": 20.06,
289
+ "eval_accuracy": 0.8158415841584158,
290
+ "eval_loss": 0.7491214275360107,
291
+ "eval_runtime": 155.8688,
292
+ "eval_samples_per_second": 97.197,
293
+ "eval_steps_per_second": 6.076,
294
+ "step": 19000
295
  }
296
  ],
297
  "logging_steps": 1000,
 
299
  "num_input_tokens_seen": 0,
300
  "num_train_epochs": 500,
301
  "save_steps": 1000,
302
+ "total_flos": 9.430146069648998e+19,
303
  "train_batch_size": 16,
304
  "trial_name": null,
305
  "trial_params": null