Kotiks committed on
Commit
bee163b
1 Parent(s): 28deffd

Training in progress, epoch 1

Browse files
all_results.json CHANGED
@@ -1,13 +1,13 @@
1
  {
2
- "epoch": 3.0,
3
- "eval_accuracy": 0.7727272727272727,
4
- "eval_loss": 0.5769956111907959,
5
- "eval_runtime": 0.3139,
6
- "eval_samples_per_second": 70.075,
7
- "eval_steps_per_second": 6.37,
8
- "total_flos": 1.4093345754980352e+16,
9
- "train_loss": 0.5933622784084744,
10
- "train_runtime": 25.6802,
11
- "train_samples_per_second": 22.079,
12
- "train_steps_per_second": 0.35
13
  }
 
1
  {
2
+ "epoch": 5.0,
3
+ "eval_accuracy": 0.7272727272727273,
4
+ "eval_loss": 0.7899118065834045,
5
+ "eval_runtime": 0.2994,
6
+ "eval_samples_per_second": 73.482,
7
+ "eval_steps_per_second": 6.68,
8
+ "total_flos": 2.348890959163392e+16,
9
+ "train_loss": 0.2989959716796875,
10
+ "train_runtime": 40.2987,
11
+ "train_samples_per_second": 23.45,
12
+ "train_steps_per_second": 0.372
13
  }
config.json CHANGED
@@ -1,18 +1,10 @@
1
  {
2
- "_name_or_path": "swin-tiny-patch4-window7-224-finetuned-eurosat-kornia",
3
  "architectures": [
4
- "SwinForImageClassification"
5
  ],
6
  "attention_probs_dropout_prob": 0.0,
7
- "depths": [
8
- 2,
9
- 2,
10
- 6,
11
- 2
12
- ],
13
- "drop_path_rate": 0.1,
14
- "embed_dim": 96,
15
- "encoder_stride": 32,
16
  "hidden_act": "gelu",
17
  "hidden_dropout_prob": 0.0,
18
  "hidden_size": 768,
@@ -22,40 +14,19 @@
22
  },
23
  "image_size": 224,
24
  "initializer_range": 0.02,
 
25
  "label2id": {
26
  "clethrionomys": 0,
27
  "sylvaemus": 1
28
  },
29
- "layer_norm_eps": 1e-05,
30
- "mlp_ratio": 4.0,
31
- "model_type": "swin",
32
  "num_channels": 3,
33
- "num_heads": [
34
- 3,
35
- 6,
36
- 12,
37
- 24
38
- ],
39
- "num_layers": 4,
40
- "out_features": [
41
- "stage4"
42
- ],
43
- "out_indices": [
44
- 4
45
- ],
46
- "patch_size": 4,
47
- "path_norm": true,
48
  "problem_type": "single_label_classification",
49
  "qkv_bias": true,
50
- "stage_names": [
51
- "stem",
52
- "stage1",
53
- "stage2",
54
- "stage3",
55
- "stage4"
56
- ],
57
  "torch_dtype": "float32",
58
- "transformers_version": "4.35.2",
59
- "use_absolute_embeddings": false,
60
- "window_size": 7
61
  }
 
1
  {
2
+ "_name_or_path": "google/vit-base-patch16-224",
3
  "architectures": [
4
+ "ViTForImageClassification"
5
  ],
6
  "attention_probs_dropout_prob": 0.0,
7
+ "encoder_stride": 16,
 
 
 
 
 
 
 
 
8
  "hidden_act": "gelu",
9
  "hidden_dropout_prob": 0.0,
10
  "hidden_size": 768,
 
14
  },
15
  "image_size": 224,
16
  "initializer_range": 0.02,
17
+ "intermediate_size": 3072,
18
  "label2id": {
19
  "clethrionomys": 0,
20
  "sylvaemus": 1
21
  },
22
+ "layer_norm_eps": 1e-12,
23
+ "model_type": "vit",
24
+ "num_attention_heads": 12,
25
  "num_channels": 3,
26
+ "num_hidden_layers": 12,
27
+ "patch_size": 16,
 
 
 
 
 
 
 
 
 
 
 
 
 
28
  "problem_type": "single_label_classification",
29
  "qkv_bias": true,
 
 
 
 
 
 
 
30
  "torch_dtype": "float32",
31
+ "transformers_version": "4.35.2"
 
 
32
  }
eval_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "epoch": 3.0,
3
- "eval_accuracy": 0.7727272727272727,
4
- "eval_loss": 0.5769956111907959,
5
- "eval_runtime": 0.3139,
6
- "eval_samples_per_second": 70.075,
7
- "eval_steps_per_second": 6.37
8
  }
 
1
  {
2
+ "epoch": 5.0,
3
+ "eval_accuracy": 0.7272727272727273,
4
+ "eval_loss": 0.7899118065834045,
5
+ "eval_runtime": 0.2994,
6
+ "eval_samples_per_second": 73.482,
7
+ "eval_steps_per_second": 6.68
8
  }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ec318a30c4de32991c1f68e1788d705fe3084cb7ac93b333eb218baf10fa3b8e
3
- size 110342832
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:14017dea4a569ea98e9e99a06667d04fb040dc086df06f0b897a9222d1e5db17
3
+ size 343223968
preprocessor_config.json CHANGED
@@ -2,19 +2,18 @@
2
  "do_normalize": true,
3
  "do_rescale": true,
4
  "do_resize": true,
5
- "feature_extractor_type": "ViTFeatureExtractor",
6
  "image_mean": [
7
- 0.485,
8
- 0.456,
9
- 0.406
10
  ],
11
- "image_processor_type": "ViTFeatureExtractor",
12
  "image_std": [
13
- 0.229,
14
- 0.224,
15
- 0.225
16
  ],
17
- "resample": 3,
18
  "rescale_factor": 0.00392156862745098,
19
  "size": {
20
  "height": 224,
 
2
  "do_normalize": true,
3
  "do_rescale": true,
4
  "do_resize": true,
 
5
  "image_mean": [
6
+ 0.5,
7
+ 0.5,
8
+ 0.5
9
  ],
10
+ "image_processor_type": "ViTImageProcessor",
11
  "image_std": [
12
+ 0.5,
13
+ 0.5,
14
+ 0.5
15
  ],
16
+ "resample": 2,
17
  "rescale_factor": 0.00392156862745098,
18
  "size": {
19
  "height": 224,
runs/Jan11_07-36-48_884473a9f125/events.out.tfevents.1704958690.884473a9f125.5987.13 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2b659f3536afd6f2a79d3131e8d58ce14e048d87c46191c7a514e022f43564d6
3
+ size 405
runs/Jan11_08-11-35_884473a9f125/events.out.tfevents.1704960712.884473a9f125.5987.14 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:677fe669792e570394ce0c7db69a10e3c40a073fde3c95e1f60a3af308b627ab
3
+ size 4663
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "epoch": 3.0,
3
- "total_flos": 1.4093345754980352e+16,
4
- "train_loss": 0.5933622784084744,
5
- "train_runtime": 25.6802,
6
- "train_samples_per_second": 22.079,
7
- "train_steps_per_second": 0.35
8
  }
 
1
  {
2
+ "epoch": 5.0,
3
+ "total_flos": 2.348890959163392e+16,
4
+ "train_loss": 0.2989959716796875,
5
+ "train_runtime": 40.2987,
6
+ "train_samples_per_second": 23.45,
7
+ "train_steps_per_second": 0.372
8
  }
trainer_state.json CHANGED
@@ -1,55 +1,79 @@
1
  {
2
- "best_metric": 0.7727272727272727,
3
- "best_model_checkpoint": "swin-tiny-patch4-window7-224-finetuned-eurosat-kornia/checkpoint-9",
4
- "epoch": 3.0,
5
  "eval_steps": 500,
6
- "global_step": 9,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
  "epoch": 1.0,
13
- "eval_accuracy": 0.2727272727272727,
14
- "eval_loss": 2.8753721714019775,
15
- "eval_runtime": 0.2391,
16
- "eval_samples_per_second": 91.995,
17
- "eval_steps_per_second": 8.363,
18
  "step": 3
19
  },
20
  {
21
  "epoch": 2.0,
22
  "eval_accuracy": 0.7272727272727273,
23
- "eval_loss": 0.5872368812561035,
24
- "eval_runtime": 0.2697,
25
- "eval_samples_per_second": 81.585,
26
- "eval_steps_per_second": 7.417,
27
  "step": 6
28
  },
29
  {
30
  "epoch": 3.0,
31
- "eval_accuracy": 0.7727272727272727,
32
- "eval_loss": 0.5769956111907959,
33
- "eval_runtime": 0.2361,
34
- "eval_samples_per_second": 93.199,
35
- "eval_steps_per_second": 8.473,
36
  "step": 9
37
  },
38
  {
39
- "epoch": 3.0,
40
- "step": 9,
41
- "total_flos": 1.4093345754980352e+16,
42
- "train_loss": 0.5933622784084744,
43
- "train_runtime": 25.6802,
44
- "train_samples_per_second": 22.079,
45
- "train_steps_per_second": 0.35
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
46
  }
47
  ],
48
  "logging_steps": 10,
49
- "max_steps": 9,
50
- "num_train_epochs": 3,
51
  "save_steps": 500,
52
- "total_flos": 1.4093345754980352e+16,
53
  "trial_name": null,
54
  "trial_params": null
55
  }
 
1
  {
2
+ "best_metric": 0.7272727272727273,
3
+ "best_model_checkpoint": "swin-tiny-patch4-window7-224-finetuned-eurosat-kornia/checkpoint-6",
4
+ "epoch": 5.0,
5
  "eval_steps": 500,
6
+ "global_step": 15,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
  "epoch": 1.0,
13
+ "eval_accuracy": 0.5454545454545454,
14
+ "eval_loss": 1.666408658027649,
15
+ "eval_runtime": 0.2367,
16
+ "eval_samples_per_second": 92.955,
17
+ "eval_steps_per_second": 8.45,
18
  "step": 3
19
  },
20
  {
21
  "epoch": 2.0,
22
  "eval_accuracy": 0.7272727272727273,
23
+ "eval_loss": 0.7899118065834045,
24
+ "eval_runtime": 0.3107,
25
+ "eval_samples_per_second": 70.812,
26
+ "eval_steps_per_second": 6.437,
27
  "step": 6
28
  },
29
  {
30
  "epoch": 3.0,
31
+ "eval_accuracy": 0.7272727272727273,
32
+ "eval_loss": 0.770358145236969,
33
+ "eval_runtime": 0.2398,
34
+ "eval_samples_per_second": 91.755,
35
+ "eval_steps_per_second": 8.341,
36
  "step": 9
37
  },
38
  {
39
+ "epoch": 3.33,
40
+ "learning_rate": 1.923076923076923e-05,
41
+ "loss": 0.3108,
42
+ "step": 10
43
+ },
44
+ {
45
+ "epoch": 4.0,
46
+ "eval_accuracy": 0.7272727272727273,
47
+ "eval_loss": 0.6269326210021973,
48
+ "eval_runtime": 0.2432,
49
+ "eval_samples_per_second": 90.452,
50
+ "eval_steps_per_second": 8.223,
51
+ "step": 12
52
+ },
53
+ {
54
+ "epoch": 5.0,
55
+ "eval_accuracy": 0.6818181818181818,
56
+ "eval_loss": 0.644472062587738,
57
+ "eval_runtime": 0.2431,
58
+ "eval_samples_per_second": 90.505,
59
+ "eval_steps_per_second": 8.228,
60
+ "step": 15
61
+ },
62
+ {
63
+ "epoch": 5.0,
64
+ "step": 15,
65
+ "total_flos": 2.348890959163392e+16,
66
+ "train_loss": 0.2989959716796875,
67
+ "train_runtime": 40.2987,
68
+ "train_samples_per_second": 23.45,
69
+ "train_steps_per_second": 0.372
70
  }
71
  ],
72
  "logging_steps": 10,
73
+ "max_steps": 15,
74
+ "num_train_epochs": 5,
75
  "save_steps": 500,
76
+ "total_flos": 2.348890959163392e+16,
77
  "trial_name": null,
78
  "trial_params": null
79
  }
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:91266273ddd1721eb2e4f402a434c3d9fdf79c26e993dbc9f212a32c572151d8
3
  size 4664
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ac99b8d429f786afbe2368d73a7192ac7df9ec55a0e50f269048b862ba068f40
3
  size 4664