krishnachnani committed on
Commit
8aa6f8f
1 Parent(s): 6efaa0a

End of training

Browse files
README.md CHANGED
@@ -2,6 +2,8 @@
2
  license: apache-2.0
3
  base_model: google/vit-base-patch16-224-in21k
4
  tags:
 
 
5
  - generated_from_trainer
6
  datasets:
7
  - imagefolder
 
2
  license: apache-2.0
3
  base_model: google/vit-base-patch16-224-in21k
4
  tags:
5
+ - image-classification
6
+ - vision
7
  - generated_from_trainer
8
  datasets:
9
  - imagefolder
all_results.json CHANGED
@@ -1,12 +1,12 @@
1
  {
2
  "epoch": 5.0,
3
- "eval_accuracy": 1.0,
4
- "eval_loss": 0.6095926761627197,
5
- "eval_runtime": 0.0372,
6
- "eval_samples_per_second": 26.907,
7
- "eval_steps_per_second": 26.907,
8
- "train_loss": 0.5933201789855957,
9
- "train_runtime": 34.8635,
10
- "train_samples_per_second": 0.143,
11
- "train_steps_per_second": 0.143
12
  }
 
1
  {
2
  "epoch": 5.0,
3
+ "eval_accuracy": 0.640625,
4
+ "eval_loss": 0.6650563478469849,
5
+ "eval_runtime": 1.0796,
6
+ "eval_samples_per_second": 59.281,
7
+ "eval_steps_per_second": 7.41,
8
+ "train_loss": 0.6482972621917724,
9
+ "train_runtime": 94.3242,
10
+ "train_samples_per_second": 0.848,
11
+ "train_steps_per_second": 0.106
12
  }
eval_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "epoch": 5.0,
3
- "eval_accuracy": 1.0,
4
- "eval_loss": 0.6095926761627197,
5
- "eval_runtime": 0.0372,
6
- "eval_samples_per_second": 26.907,
7
- "eval_steps_per_second": 26.907
8
  }
 
1
  {
2
  "epoch": 5.0,
3
+ "eval_accuracy": 0.640625,
4
+ "eval_loss": 0.6650563478469849,
5
+ "eval_runtime": 1.0796,
6
+ "eval_samples_per_second": 59.281,
7
+ "eval_steps_per_second": 7.41
8
  }
runs/Apr03_23-33-41_4da9d9357a4f/events.out.tfevents.1712187341.4da9d9357a4f.2580.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ecf5e3825af8d41d58f3e54d2c5af77b17da059123bcbf0e8993be7e66e2ac5d
3
+ size 405
train_results.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
  "epoch": 5.0,
3
- "train_loss": 0.5933201789855957,
4
- "train_runtime": 34.8635,
5
- "train_samples_per_second": 0.143,
6
- "train_steps_per_second": 0.143
7
  }
 
1
  {
2
  "epoch": 5.0,
3
+ "train_loss": 0.6482972621917724,
4
+ "train_runtime": 94.3242,
5
+ "train_samples_per_second": 0.848,
6
+ "train_steps_per_second": 0.106
7
  }
trainer_state.json CHANGED
@@ -1,74 +1,81 @@
1
  {
2
- "best_metric": 0.6095926761627197,
3
- "best_model_checkpoint": "./outputs/checkpoint-1",
4
  "epoch": 5.0,
5
  "eval_steps": 500,
6
- "global_step": 5,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
  "epoch": 1.0,
13
- "eval_accuracy": 1.0,
14
- "eval_loss": 0.6095926761627197,
15
- "eval_runtime": 0.0508,
16
- "eval_samples_per_second": 19.702,
17
- "eval_steps_per_second": 19.702,
18
- "step": 1
19
  },
20
  {
21
  "epoch": 2.0,
22
- "eval_accuracy": 1.0,
23
- "eval_loss": 0.6161552667617798,
24
- "eval_runtime": 0.0531,
25
- "eval_samples_per_second": 18.826,
26
- "eval_steps_per_second": 18.826,
27
- "step": 2
28
  },
29
  {
30
  "epoch": 3.0,
31
- "eval_accuracy": 1.0,
32
- "eval_loss": 0.6204718947410583,
33
- "eval_runtime": 0.0536,
34
- "eval_samples_per_second": 18.649,
35
- "eval_steps_per_second": 18.649,
36
- "step": 3
37
  },
38
  {
39
  "epoch": 4.0,
40
- "eval_accuracy": 1.0,
41
- "eval_loss": 0.6235671043395996,
42
- "eval_runtime": 0.0594,
43
- "eval_samples_per_second": 16.824,
44
- "eval_steps_per_second": 16.824,
45
- "step": 4
 
 
 
 
 
 
 
46
  },
47
  {
48
  "epoch": 5.0,
49
- "eval_accuracy": 1.0,
50
- "eval_loss": 0.6252284646034241,
51
- "eval_runtime": 0.0612,
52
- "eval_samples_per_second": 16.331,
53
- "eval_steps_per_second": 16.331,
54
- "step": 5
55
  },
56
  {
57
  "epoch": 5.0,
58
- "step": 5,
59
- "total_flos": 387459948072960.0,
60
- "train_loss": 0.5933201789855957,
61
- "train_runtime": 34.8635,
62
- "train_samples_per_second": 0.143,
63
- "train_steps_per_second": 0.143
64
  }
65
  ],
66
  "logging_steps": 10,
67
- "max_steps": 5,
68
  "num_input_tokens_seen": 0,
69
  "num_train_epochs": 5,
70
  "save_steps": 500,
71
- "total_flos": 387459948072960.0,
72
  "train_batch_size": 8,
73
  "trial_name": null,
74
  "trial_params": null
 
1
  {
2
+ "best_metric": 0.6650563478469849,
3
+ "best_model_checkpoint": "./outputs/checkpoint-10",
4
  "epoch": 5.0,
5
  "eval_steps": 500,
6
+ "global_step": 10,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
  "epoch": 1.0,
13
+ "eval_accuracy": 0.5625,
14
+ "eval_loss": 0.6905453205108643,
15
+ "eval_runtime": 27.9364,
16
+ "eval_samples_per_second": 2.291,
17
+ "eval_steps_per_second": 0.286,
18
+ "step": 2
19
  },
20
  {
21
  "epoch": 2.0,
22
+ "eval_accuracy": 0.65625,
23
+ "eval_loss": 0.6797380447387695,
24
+ "eval_runtime": 1.0941,
25
+ "eval_samples_per_second": 58.493,
26
+ "eval_steps_per_second": 7.312,
27
+ "step": 4
28
  },
29
  {
30
  "epoch": 3.0,
31
+ "eval_accuracy": 0.65625,
32
+ "eval_loss": 0.67192143201828,
33
+ "eval_runtime": 1.0069,
34
+ "eval_samples_per_second": 63.562,
35
+ "eval_steps_per_second": 7.945,
36
+ "step": 6
37
  },
38
  {
39
  "epoch": 4.0,
40
+ "eval_accuracy": 0.65625,
41
+ "eval_loss": 0.6670976281166077,
42
+ "eval_runtime": 1.2194,
43
+ "eval_samples_per_second": 52.486,
44
+ "eval_steps_per_second": 6.561,
45
+ "step": 8
46
+ },
47
+ {
48
+ "epoch": 5.0,
49
+ "grad_norm": 1.3951447010040283,
50
+ "learning_rate": 0.0,
51
+ "loss": 0.6483,
52
+ "step": 10
53
  },
54
  {
55
  "epoch": 5.0,
56
+ "eval_accuracy": 0.640625,
57
+ "eval_loss": 0.6650563478469849,
58
+ "eval_runtime": 1.0203,
59
+ "eval_samples_per_second": 62.726,
60
+ "eval_steps_per_second": 7.841,
61
+ "step": 10
62
  },
63
  {
64
  "epoch": 5.0,
65
+ "step": 10,
66
+ "total_flos": 6199359169167360.0,
67
+ "train_loss": 0.6482972621917724,
68
+ "train_runtime": 94.3242,
69
+ "train_samples_per_second": 0.848,
70
+ "train_steps_per_second": 0.106
71
  }
72
  ],
73
  "logging_steps": 10,
74
+ "max_steps": 10,
75
  "num_input_tokens_seen": 0,
76
  "num_train_epochs": 5,
77
  "save_steps": 500,
78
+ "total_flos": 6199359169167360.0,
79
  "train_batch_size": 8,
80
  "trial_name": null,
81
  "trial_params": null