t1msan committed on
Commit
5b91158
·
verified ·
1 Parent(s): 4d27732

End of training

Browse files
README.md CHANGED
@@ -15,7 +15,7 @@ should probably proofread and complete it, then remove this comment. -->
15
 
16
  This model was trained from scratch on the imagefolder dataset.
17
  It achieves the following results on the evaluation set:
18
- - Loss: 0.0949
19
 
20
  ## Model description
21
 
@@ -49,11 +49,11 @@ The following hyperparameters were used during training:
49
 
50
  | Training Loss | Epoch | Step | Validation Loss |
51
  |:-------------:|:-----:|:----:|:---------------:|
52
- | No log | 0.84 | 4 | 0.1084 |
53
- | No log | 1.89 | 9 | 0.0994 |
54
- | 0.0064 | 2.95 | 14 | 0.1109 |
55
- | 0.0064 | 4.0 | 19 | 0.0949 |
56
- | 0.0594 | 4.21 | 20 | 0.0992 |
57
 
58
 
59
  ### Framework versions
 
15
 
16
  This model was trained from scratch on the imagefolder dataset.
17
  It achieves the following results on the evaluation set:
18
+ - Loss: 0.1355
19
 
20
  ## Model description
21
 
 
49
 
50
  | Training Loss | Epoch | Step | Validation Loss |
51
  |:-------------:|:-----:|:----:|:---------------:|
52
+ | No log | 0.84 | 4 | 0.6557 |
53
+ | No log | 1.89 | 9 | 0.1355 |
54
+ | 0.0289 | 2.95 | 14 | 0.2163 |
55
+ | 0.0289 | 4.0 | 19 | 0.1560 |
56
+ | 0.0616 | 4.21 | 20 | 0.1556 |
57
 
58
 
59
  ### Framework versions
all_results.json CHANGED
@@ -1,12 +1,12 @@
1
  {
2
  "epoch": 4.21,
3
- "eval_loss": 0.09485718607902527,
4
- "eval_runtime": 2.2406,
5
- "eval_samples_per_second": 58.913,
6
- "eval_steps_per_second": 1.339,
7
  "total_flos": 1.2713250126082867e+17,
8
- "train_loss": 0.03291104771196842,
9
- "train_runtime": 113.6566,
10
- "train_samples_per_second": 51.911,
11
- "train_steps_per_second": 0.176
12
  }
 
1
  {
2
  "epoch": 4.21,
3
+ "eval_loss": 0.1355326622724533,
4
+ "eval_runtime": 2.2928,
5
+ "eval_samples_per_second": 57.572,
6
+ "eval_steps_per_second": 1.308,
7
  "total_flos": 1.2713250126082867e+17,
8
+ "train_loss": 0.04524529278278351,
9
+ "train_runtime": 114.2042,
10
+ "train_samples_per_second": 51.662,
11
+ "train_steps_per_second": 0.175
12
  }
eval_results.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
  "epoch": 4.21,
3
- "eval_loss": 0.09485718607902527,
4
- "eval_runtime": 2.2406,
5
- "eval_samples_per_second": 58.913,
6
- "eval_steps_per_second": 1.339
7
  }
 
1
  {
2
  "epoch": 4.21,
3
+ "eval_loss": 0.1355326622724533,
4
+ "eval_runtime": 2.2928,
5
+ "eval_samples_per_second": 57.572,
6
+ "eval_steps_per_second": 1.308
7
  }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8e9ffcaa5e45c4cc241ef9b0880f7ec96d36e1e368f732afc02666f0a5a311a4
3
  size 113412768
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6015446eefc0b825750f160d47825ece7ec95ec20cd49b985d526e5633dfeb6f
3
  size 113412768
runs/Apr21_17-38-15_51d30877b6e2/events.out.tfevents.1713721096.51d30877b6e2.34.10 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3f546fa98badbc34e21070094589ca3e3fa57479f46adc606c9006e7e4967bcd
3
+ size 76237
runs/Apr21_17-38-15_51d30877b6e2/events.out.tfevents.1713721213.51d30877b6e2.34.11 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ad8bf345f3bb8bcb748c3156f2913ed67adb5f9d8a5ef0f9d870d31f85cf2ac2
3
+ size 354
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "epoch": 4.21,
3
  "total_flos": 1.2713250126082867e+17,
4
- "train_loss": 0.03291104771196842,
5
- "train_runtime": 113.6566,
6
- "train_samples_per_second": 51.911,
7
- "train_steps_per_second": 0.176
8
  }
 
1
  {
2
  "epoch": 4.21,
3
  "total_flos": 1.2713250126082867e+17,
4
+ "train_loss": 0.04524529278278351,
5
+ "train_runtime": 114.2042,
6
+ "train_samples_per_second": 51.662,
7
+ "train_steps_per_second": 0.175
8
  }
trainer_state.json CHANGED
@@ -1,6 +1,6 @@
1
  {
2
- "best_metric": 0.09485718607902527,
3
- "best_model_checkpoint": "microsoft/swin-tiny-patch4-window7-224/checkpoint-19",
4
  "epoch": 4.2105263157894735,
5
  "eval_steps": 500,
6
  "global_step": 20,
@@ -10,66 +10,66 @@
10
  "log_history": [
11
  {
12
  "epoch": 0.84,
13
- "eval_loss": 0.10838964581489563,
14
- "eval_runtime": 2.1432,
15
- "eval_samples_per_second": 61.591,
16
- "eval_steps_per_second": 1.4,
17
  "step": 4
18
  },
19
  {
20
  "epoch": 1.89,
21
- "eval_loss": 0.0993674173951149,
22
- "eval_runtime": 2.1471,
23
- "eval_samples_per_second": 61.478,
24
- "eval_steps_per_second": 1.397,
25
  "step": 9
26
  },
27
  {
28
  "epoch": 2.11,
29
- "grad_norm": 5.258437633514404,
30
  "learning_rate": 2.777777777777778e-05,
31
- "loss": 0.0064,
32
  "step": 10
33
  },
34
  {
35
  "epoch": 2.95,
36
- "eval_loss": 0.11093668639659882,
37
- "eval_runtime": 2.1002,
38
- "eval_samples_per_second": 62.851,
39
- "eval_steps_per_second": 1.428,
40
  "step": 14
41
  },
42
  {
43
  "epoch": 4.0,
44
- "eval_loss": 0.09485718607902527,
45
- "eval_runtime": 2.1285,
46
- "eval_samples_per_second": 62.014,
47
- "eval_steps_per_second": 1.409,
48
  "step": 19
49
  },
50
  {
51
  "epoch": 4.21,
52
- "grad_norm": 12.606084823608398,
53
  "learning_rate": 0.0,
54
- "loss": 0.0594,
55
  "step": 20
56
  },
57
  {
58
  "epoch": 4.21,
59
- "eval_loss": 0.09918802976608276,
60
- "eval_runtime": 2.1364,
61
- "eval_samples_per_second": 61.786,
62
- "eval_steps_per_second": 1.404,
63
  "step": 20
64
  },
65
  {
66
  "epoch": 4.21,
67
  "step": 20,
68
  "total_flos": 1.2713250126082867e+17,
69
- "train_loss": 0.03291104771196842,
70
- "train_runtime": 113.6566,
71
- "train_samples_per_second": 51.911,
72
- "train_steps_per_second": 0.176
73
  }
74
  ],
75
  "logging_steps": 10,
 
1
  {
2
+ "best_metric": 0.1355326622724533,
3
+ "best_model_checkpoint": "microsoft/swin-tiny-patch4-window7-224/checkpoint-9",
4
  "epoch": 4.2105263157894735,
5
  "eval_steps": 500,
6
  "global_step": 20,
 
10
  "log_history": [
11
  {
12
  "epoch": 0.84,
13
+ "eval_loss": 0.6557008028030396,
14
+ "eval_runtime": 2.3009,
15
+ "eval_samples_per_second": 57.37,
16
+ "eval_steps_per_second": 1.304,
17
  "step": 4
18
  },
19
  {
20
  "epoch": 1.89,
21
+ "eval_loss": 0.1355326622724533,
22
+ "eval_runtime": 2.1272,
23
+ "eval_samples_per_second": 62.052,
24
+ "eval_steps_per_second": 1.41,
25
  "step": 9
26
  },
27
  {
28
  "epoch": 2.11,
29
+ "grad_norm": 11.091564178466797,
30
  "learning_rate": 2.777777777777778e-05,
31
+ "loss": 0.0289,
32
  "step": 10
33
  },
34
  {
35
  "epoch": 2.95,
36
+ "eval_loss": 0.21629740297794342,
37
+ "eval_runtime": 2.0797,
38
+ "eval_samples_per_second": 63.472,
39
+ "eval_steps_per_second": 1.443,
40
  "step": 14
41
  },
42
  {
43
  "epoch": 4.0,
44
+ "eval_loss": 0.1559712290763855,
45
+ "eval_runtime": 2.1584,
46
+ "eval_samples_per_second": 61.156,
47
+ "eval_steps_per_second": 1.39,
48
  "step": 19
49
  },
50
  {
51
  "epoch": 4.21,
52
+ "grad_norm": 14.637483596801758,
53
  "learning_rate": 0.0,
54
+ "loss": 0.0616,
55
  "step": 20
56
  },
57
  {
58
  "epoch": 4.21,
59
+ "eval_loss": 0.15557000041007996,
60
+ "eval_runtime": 2.0834,
61
+ "eval_samples_per_second": 63.359,
62
+ "eval_steps_per_second": 1.44,
63
  "step": 20
64
  },
65
  {
66
  "epoch": 4.21,
67
  "step": 20,
68
  "total_flos": 1.2713250126082867e+17,
69
+ "train_loss": 0.04524529278278351,
70
+ "train_runtime": 114.2042,
71
+ "train_samples_per_second": 51.662,
72
+ "train_steps_per_second": 0.175
73
  }
74
  ],
75
  "logging_steps": 10,
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b4136ad41440be17e9854998fa3ee1ff6230f98cf3848dc429e89c05f04c4b4c
3
  size 4984
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:955fbccfb056fd45980d796c9bd392d21f7f68a03856b0e6d69e15cf1c7c4bd1
3
  size 4984