jvadlamudi2 committed on
Commit
555f0cd
1 Parent(s): 82adb67

Training in progress, epoch 1

Browse files
all_results.json CHANGED
@@ -6,8 +6,8 @@
6
  "eval_samples_per_second": 132.281,
7
  "eval_steps_per_second": 4.724,
8
  "total_flos": 6.716617754447462e+16,
9
- "train_loss": 0.642929474512736,
10
- "train_runtime": 92.7694,
11
- "train_samples_per_second": 28.813,
12
- "train_steps_per_second": 0.226
13
  }
 
6
  "eval_samples_per_second": 132.281,
7
  "eval_steps_per_second": 4.724,
8
  "total_flos": 6.716617754447462e+16,
9
+ "train_loss": 0.630237170628139,
10
+ "train_runtime": 87.2731,
11
+ "train_samples_per_second": 30.628,
12
+ "train_steps_per_second": 0.241
13
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b3b2c2b1413b42944b9ae0df2cf346feef3026d6e754bbad15e404e814d18547
3
  size 111349029
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fe733b12e80dc32a5d3038c144657e73ee755096cf10005a41955e4c27a9ff68
3
  size 111349029
runs/Jul24_17-51-34_79617dc78cd9/events.out.tfevents.1690221823.79617dc78cd9.248.16 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:15cd42c63dadb6adcea864e3e1927d50f59f1c418b0fa836b32f5be3baaec530
3
+ size 4594
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "epoch": 3.0,
3
  "total_flos": 6.716617754447462e+16,
4
- "train_loss": 0.642929474512736,
5
- "train_runtime": 92.7694,
6
- "train_samples_per_second": 28.813,
7
- "train_steps_per_second": 0.226
8
  }
 
1
  {
2
  "epoch": 3.0,
3
  "total_flos": 6.716617754447462e+16,
4
+ "train_loss": 0.630237170628139,
5
+ "train_runtime": 87.2731,
6
+ "train_samples_per_second": 30.628,
7
+ "train_steps_per_second": 0.241
8
  }
trainer_state.json CHANGED
@@ -1,6 +1,6 @@
1
  {
2
- "best_metric": 0.75,
3
- "best_model_checkpoint": "convnext-tiny-224-jvadlamudi2/checkpoint-21",
4
  "epoch": 3.0,
5
  "global_step": 21,
6
  "is_hyper_param_search": false,
@@ -9,51 +9,51 @@
9
  "log_history": [
10
  {
11
  "epoch": 1.0,
12
- "eval_accuracy": 0.6964285714285714,
13
- "eval_loss": 0.6321507692337036,
14
- "eval_runtime": 0.9364,
15
- "eval_samples_per_second": 119.604,
16
- "eval_steps_per_second": 4.272,
17
  "step": 7
18
  },
19
  {
20
  "epoch": 1.43,
21
  "learning_rate": 3.055555555555556e-05,
22
- "loss": 0.6503,
23
  "step": 10
24
  },
25
  {
26
  "epoch": 2.0,
27
- "eval_accuracy": 0.7142857142857143,
28
- "eval_loss": 0.6245036721229553,
29
- "eval_runtime": 0.788,
30
- "eval_samples_per_second": 142.126,
31
- "eval_steps_per_second": 5.076,
32
  "step": 14
33
  },
34
  {
35
  "epoch": 2.86,
36
  "learning_rate": 2.777777777777778e-06,
37
- "loss": 0.6372,
38
  "step": 20
39
  },
40
  {
41
  "epoch": 3.0,
42
- "eval_accuracy": 0.75,
43
- "eval_loss": 0.6208862662315369,
44
- "eval_runtime": 0.7892,
45
- "eval_samples_per_second": 141.913,
46
- "eval_steps_per_second": 5.068,
47
  "step": 21
48
  },
49
  {
50
  "epoch": 3.0,
51
  "step": 21,
52
  "total_flos": 6.716617754447462e+16,
53
- "train_loss": 0.642929474512736,
54
- "train_runtime": 92.7694,
55
- "train_samples_per_second": 28.813,
56
- "train_steps_per_second": 0.226
57
  }
58
  ],
59
  "max_steps": 21,
 
1
  {
2
+ "best_metric": 0.7946428571428571,
3
+ "best_model_checkpoint": "convnext-tiny-224-jvadlamudi2/checkpoint-14",
4
  "epoch": 3.0,
5
  "global_step": 21,
6
  "is_hyper_param_search": false,
 
9
  "log_history": [
10
  {
11
  "epoch": 1.0,
12
+ "eval_accuracy": 0.7678571428571429,
13
+ "eval_loss": 0.6085006594657898,
14
+ "eval_runtime": 0.7752,
15
+ "eval_samples_per_second": 144.48,
16
+ "eval_steps_per_second": 5.16,
17
  "step": 7
18
  },
19
  {
20
  "epoch": 1.43,
21
  "learning_rate": 3.055555555555556e-05,
22
+ "loss": 0.6388,
23
  "step": 10
24
  },
25
  {
26
  "epoch": 2.0,
27
+ "eval_accuracy": 0.7946428571428571,
28
+ "eval_loss": 0.5984492897987366,
29
+ "eval_runtime": 0.82,
30
+ "eval_samples_per_second": 136.58,
31
+ "eval_steps_per_second": 4.878,
32
  "step": 14
33
  },
34
  {
35
  "epoch": 2.86,
36
  "learning_rate": 2.777777777777778e-06,
37
+ "loss": 0.6218,
38
  "step": 20
39
  },
40
  {
41
  "epoch": 3.0,
42
+ "eval_accuracy": 0.7857142857142857,
43
+ "eval_loss": 0.5960062742233276,
44
+ "eval_runtime": 0.8803,
45
+ "eval_samples_per_second": 127.229,
46
+ "eval_steps_per_second": 4.544,
47
  "step": 21
48
  },
49
  {
50
  "epoch": 3.0,
51
  "step": 21,
52
  "total_flos": 6.716617754447462e+16,
53
+ "train_loss": 0.630237170628139,
54
+ "train_runtime": 87.2731,
55
+ "train_samples_per_second": 30.628,
56
+ "train_steps_per_second": 0.241
57
  }
58
  ],
59
  "max_steps": 21,