dima806 committed on
Commit
c423eea
1 Parent(s): 2f915fb

Upload folder using huggingface_hub

Browse files
checkpoint-4098/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:799e436ba9dae406587780e581adc068c714652b56e1cf47c479634c697a8111
3
  size 343368556
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7584bee441a46ff02eaabaf77128796f7ce04506a497a42af795348c96b05551
3
  size 343368556
checkpoint-4098/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:596e3fbc6266f3d044c381838444742f8585677383ebb9f0c0f36053a1f41bf0
3
  size 686857605
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6506a7b9414316ab905d68d8fbc10617fc0981edf7ef6c2eb3ecc5f01eea5680
3
  size 686857605
checkpoint-4098/trainer_state.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "best_metric": 3.0359206199645996,
3
  "best_model_checkpoint": "military_aircraft_image_detection/checkpoint-4098",
4
  "epoch": 6.0,
5
  "eval_steps": 500,
@@ -10,112 +10,112 @@
10
  "log_history": [
11
  {
12
  "epoch": 0.7320644216691069,
13
- "grad_norm": 1.6647233963012695,
14
  "learning_rate": 1.7776679841897234e-07,
15
- "loss": 2.9861,
16
  "step": 500
17
  },
18
  {
19
  "epoch": 1.0,
20
- "eval_accuracy": 0.5055658627087198,
21
- "eval_loss": 3.063667058944702,
22
- "eval_runtime": 424.0571,
23
- "eval_samples_per_second": 68.637,
24
- "eval_steps_per_second": 2.146,
25
  "step": 683
26
  },
27
  {
28
  "epoch": 1.4641288433382138,
29
- "grad_norm": 1.5988911390304565,
30
  "learning_rate": 1.5306324110671935e-07,
31
- "loss": 2.9774,
32
  "step": 1000
33
  },
34
  {
35
  "epoch": 2.0,
36
- "eval_accuracy": 0.5072150072150072,
37
- "eval_loss": 3.0537939071655273,
38
- "eval_runtime": 426.3521,
39
- "eval_samples_per_second": 68.268,
40
- "eval_steps_per_second": 2.134,
41
  "step": 1366
42
  },
43
  {
44
  "epoch": 2.1961932650073206,
45
- "grad_norm": 1.980846643447876,
46
  "learning_rate": 1.283596837944664e-07,
47
- "loss": 2.9709,
48
  "step": 1500
49
  },
50
  {
51
  "epoch": 2.9282576866764276,
52
- "grad_norm": 1.8870298862457275,
53
  "learning_rate": 1.0365612648221343e-07,
54
- "loss": 2.9632,
55
  "step": 2000
56
  },
57
  {
58
  "epoch": 3.0,
59
- "eval_accuracy": 0.5092420806706521,
60
- "eval_loss": 3.046130895614624,
61
- "eval_runtime": 420.1974,
62
- "eval_samples_per_second": 69.267,
63
- "eval_steps_per_second": 2.166,
64
  "step": 2049
65
  },
66
  {
67
  "epoch": 3.660322108345534,
68
- "grad_norm": 1.7387105226516724,
69
  "learning_rate": 7.895256916996047e-08,
70
- "loss": 2.9561,
71
  "step": 2500
72
  },
73
  {
74
  "epoch": 4.0,
75
- "eval_accuracy": 0.5113035113035113,
76
- "eval_loss": 3.040210485458374,
77
- "eval_runtime": 421.3061,
78
- "eval_samples_per_second": 69.085,
79
- "eval_steps_per_second": 2.16,
80
  "step": 2732
81
  },
82
  {
83
  "epoch": 4.392386530014641,
84
- "grad_norm": 1.7102471590042114,
85
  "learning_rate": 5.4249011857707506e-08,
86
- "loss": 2.9553,
87
  "step": 3000
88
  },
89
  {
90
  "epoch": 5.0,
91
- "eval_accuracy": 0.5126090840376555,
92
- "eval_loss": 3.0369255542755127,
93
- "eval_runtime": 421.777,
94
- "eval_samples_per_second": 69.008,
95
- "eval_steps_per_second": 2.158,
96
  "step": 3415
97
  },
98
  {
99
  "epoch": 5.124450951683748,
100
- "grad_norm": 1.660888910293579,
101
  "learning_rate": 2.9545454545454546e-08,
102
- "loss": 2.9493,
103
  "step": 3500
104
  },
105
  {
106
  "epoch": 5.856515373352855,
107
- "grad_norm": 1.8840000629425049,
108
  "learning_rate": 4.8418972332015805e-09,
109
- "loss": 2.9496,
110
  "step": 4000
111
  },
112
  {
113
  "epoch": 6.0,
114
- "eval_accuracy": 0.5126777983920842,
115
- "eval_loss": 3.0359206199645996,
116
- "eval_runtime": 430.3036,
117
- "eval_samples_per_second": 67.641,
118
- "eval_steps_per_second": 2.115,
119
  "step": 4098
120
  }
121
  ],
 
1
  {
2
+ "best_metric": 2.96836519241333,
3
  "best_model_checkpoint": "military_aircraft_image_detection/checkpoint-4098",
4
  "epoch": 6.0,
5
  "eval_steps": 500,
 
10
  "log_history": [
11
  {
12
  "epoch": 0.7320644216691069,
13
+ "grad_norm": 1.73904550075531,
14
  "learning_rate": 1.7776679841897234e-07,
15
+ "loss": 2.9196,
16
  "step": 500
17
  },
18
  {
19
  "epoch": 1.0,
20
+ "eval_accuracy": 0.5273139558853844,
21
+ "eval_loss": 2.9956250190734863,
22
+ "eval_runtime": 433.4755,
23
+ "eval_samples_per_second": 67.146,
24
+ "eval_steps_per_second": 2.099,
25
  "step": 683
26
  },
27
  {
28
  "epoch": 1.4641288433382138,
29
+ "grad_norm": 1.7973357439041138,
30
  "learning_rate": 1.5306324110671935e-07,
31
+ "loss": 2.9104,
32
  "step": 1000
33
  },
34
  {
35
  "epoch": 2.0,
36
+ "eval_accuracy": 0.5284477427334571,
37
+ "eval_loss": 2.985973596572876,
38
+ "eval_runtime": 429.4589,
39
+ "eval_samples_per_second": 67.774,
40
+ "eval_steps_per_second": 2.119,
41
  "step": 1366
42
  },
43
  {
44
  "epoch": 2.1961932650073206,
45
+ "grad_norm": 1.7381324768066406,
46
  "learning_rate": 1.283596837944664e-07,
47
+ "loss": 2.9038,
48
  "step": 1500
49
  },
50
  {
51
  "epoch": 2.9282576866764276,
52
+ "grad_norm": 1.8419060707092285,
53
  "learning_rate": 1.0365612648221343e-07,
54
+ "loss": 2.8969,
55
  "step": 2000
56
  },
57
  {
58
  "epoch": 3.0,
59
+ "eval_accuracy": 0.5296158867587439,
60
+ "eval_loss": 2.9781196117401123,
61
+ "eval_runtime": 416.4739,
62
+ "eval_samples_per_second": 69.887,
63
+ "eval_steps_per_second": 2.185,
64
  "step": 2049
65
  },
66
  {
67
  "epoch": 3.660322108345534,
68
+ "grad_norm": 1.8417006731033325,
69
  "learning_rate": 7.895256916996047e-08,
70
+ "loss": 2.8889,
71
  "step": 2500
72
  },
73
  {
74
  "epoch": 4.0,
75
+ "eval_accuracy": 0.5304061018346733,
76
+ "eval_loss": 2.972407341003418,
77
+ "eval_runtime": 417.0986,
78
+ "eval_samples_per_second": 69.782,
79
+ "eval_steps_per_second": 2.182,
80
  "step": 2732
81
  },
82
  {
83
  "epoch": 4.392386530014641,
84
+ "grad_norm": 2.0208425521850586,
85
  "learning_rate": 5.4249011857707506e-08,
86
+ "loss": 2.8874,
87
  "step": 3000
88
  },
89
  {
90
  "epoch": 5.0,
91
+ "eval_accuracy": 0.5309901738473167,
92
+ "eval_loss": 2.969489097595215,
93
+ "eval_runtime": 410.5775,
94
+ "eval_samples_per_second": 70.89,
95
+ "eval_steps_per_second": 2.216,
96
  "step": 3415
97
  },
98
  {
99
  "epoch": 5.124450951683748,
100
+ "grad_norm": 2.0944771766662598,
101
  "learning_rate": 2.9545454545454546e-08,
102
+ "loss": 2.8839,
103
  "step": 3500
104
  },
105
  {
106
  "epoch": 5.856515373352855,
107
+ "grad_norm": 2.000408172607422,
108
  "learning_rate": 4.8418972332015805e-09,
109
+ "loss": 2.8841,
110
  "step": 4000
111
  },
112
  {
113
  "epoch": 6.0,
114
+ "eval_accuracy": 0.5313337456194599,
115
+ "eval_loss": 2.96836519241333,
116
+ "eval_runtime": 417.3097,
117
+ "eval_samples_per_second": 69.747,
118
+ "eval_steps_per_second": 2.181,
119
  "step": 4098
120
  }
121
  ],
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:923fc237a7178ad4f3cd707c2dc8fe102bafc4d70fff52937323240528eb0193
3
  size 343368556
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7584bee441a46ff02eaabaf77128796f7ce04506a497a42af795348c96b05551
3
  size 343368556
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3c3c1aac80e6fe46ec431fce06da55507d3c3019a55448e3210fba2cc3f10ce0
3
  size 4603
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dd420b36012d3de1b843696fecff72de7b75f1e32a6360e988cfe1bc3561f0f6
3
  size 4603