d071696 committed on
Commit
76d4e53
1 Parent(s): 7b74f5e

Training in progress, step 300

Browse files
all_results.json CHANGED
@@ -1,13 +1,13 @@
1
  {
2
  "epoch": 4.0,
3
- "eval_accuracy": 0.9963782696177063,
4
- "eval_loss": 0.012937591411173344,
5
- "eval_runtime": 48.4901,
6
- "eval_samples_per_second": 51.248,
7
- "eval_steps_per_second": 6.414,
8
  "total_flos": 7439897757745152.0,
9
- "train_loss": 2.0212895274162292,
10
- "train_runtime": 7.7329,
11
- "train_samples_per_second": 12.414,
12
- "train_steps_per_second": 1.552
13
  }
 
1
  {
2
  "epoch": 4.0,
3
+ "eval_accuracy": 0.9583333333333334,
4
+ "eval_loss": 1.039479374885559,
5
+ "eval_runtime": 1.0974,
6
+ "eval_samples_per_second": 21.87,
7
+ "eval_steps_per_second": 2.734,
8
  "total_flos": 7439897757745152.0,
9
+ "train_loss": 1.4209961891174316,
10
+ "train_runtime": 7.3487,
11
+ "train_samples_per_second": 13.064,
12
+ "train_steps_per_second": 1.089
13
  }
config.json CHANGED
@@ -9,35 +9,33 @@
9
  "hidden_dropout_prob": 0.0,
10
  "hidden_size": 768,
11
  "id2label": {
12
- "0": "carton boxes",
13
- "1": "old newspapers",
14
- "10": "used juice box",
15
- "11": "used plastic bottles labels",
16
- "2": "old newspapers with plastic bottles and plastic garbage",
17
- "3": "paper boxes and plastic trash bags",
18
- "4": "paper waste",
19
- "5": "plastic bottles",
20
- "6": "plastic bottles and plastic bags with paper boxes",
21
- "7": "plastic bottles and plastic garbage",
22
- "8": "plastic garbage",
23
- "9": "plastic garbage and paper garbage"
24
  },
25
  "image_size": 224,
26
  "initializer_range": 0.02,
27
  "intermediate_size": 3072,
28
  "label2id": {
29
- "carton boxes": "0",
30
- "old newspapers": "1",
31
- "old newspapers with plastic bottles and plastic garbage": "2",
32
- "paper boxes and plastic trash bags": "3",
33
- "paper waste": "4",
34
- "plastic bottles": "5",
35
- "plastic bottles and plastic bags with paper boxes": "6",
36
- "plastic bottles and plastic garbage": "7",
37
- "plastic garbage": "8",
38
- "plastic garbage and paper garbage": "9",
39
- "used juice box": "10",
40
- "used plastic bottles labels": "11"
41
  },
42
  "layer_norm_eps": 1e-12,
43
  "model_type": "vit",
 
9
  "hidden_dropout_prob": 0.0,
10
  "hidden_size": 768,
11
  "id2label": {
12
+ "0": "aluminium",
13
+ "1": "batteries",
14
+ "10": "takeaway cups",
15
+ "2": "cardboard",
16
+ "3": "disposable plates",
17
+ "4": "glass",
18
+ "5": "hard plastic",
19
+ "6": "paper",
20
+ "7": "paper towel",
21
+ "8": "polystyrene",
22
+ "9": "soft plastics"
 
23
  },
24
  "image_size": 224,
25
  "initializer_range": 0.02,
26
  "intermediate_size": 3072,
27
  "label2id": {
28
+ "aluminium": "0",
29
+ "batteries": "1",
30
+ "cardboard": "2",
31
+ "disposable plates": "3",
32
+ "glass": "4",
33
+ "hard plastic": "5",
34
+ "paper": "6",
35
+ "paper towel": "7",
36
+ "polystyrene": "8",
37
+ "soft plastics": "9",
38
+ "takeaway cups": "10"
 
39
  },
40
  "layer_norm_eps": 1e-12,
41
  "model_type": "vit",
eval_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "epoch": 4.0,
3
- "eval_accuracy": 0.9963782696177063,
4
- "eval_loss": 0.012937591411173344,
5
- "eval_runtime": 48.4901,
6
- "eval_samples_per_second": 51.248,
7
- "eval_steps_per_second": 6.414
8
  }
 
1
  {
2
  "epoch": 4.0,
3
+ "eval_accuracy": 0.9583333333333334,
4
+ "eval_loss": 1.039479374885559,
5
+ "eval_runtime": 1.0974,
6
+ "eval_samples_per_second": 21.87,
7
+ "eval_steps_per_second": 2.734
8
  }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:17ae2382b9eca4f52fc4d17a9cb546b8971f310d461d0e085613297c710f7ff9
3
- size 343254736
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ca8ca01f0c031632e2131270776a232480fdf9bfe32ab7ad11e498d1d677a5a9
3
+ size 343251660
runs/Mar29_18-51-27_X5C922065N/events.out.tfevents.1711734830.X5C922065N.77198.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cb92060756fa2c4f538ca77c69a721411f79d55d3f3537b2e74a15d4cca51788
3
+ size 405
runs/Mar29_18-51-27_X5C922065N/events.out.tfevents.1711734965.X5C922065N.77198.2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b64f0498695854ebda0c5046adb2a9adece839413b4b4c765764e35204ae4c2a
3
+ size 12367
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "epoch": 4.0,
3
  "total_flos": 7439897757745152.0,
4
- "train_loss": 2.0212895274162292,
5
- "train_runtime": 7.7329,
6
- "train_samples_per_second": 12.414,
7
- "train_steps_per_second": 1.552
8
  }
 
1
  {
2
  "epoch": 4.0,
3
  "total_flos": 7439897757745152.0,
4
+ "train_loss": 1.4209961891174316,
5
+ "train_runtime": 7.3487,
6
+ "train_samples_per_second": 13.064,
7
+ "train_steps_per_second": 1.089
8
  }
trainer_state.json CHANGED
@@ -2,36 +2,29 @@
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
  "epoch": 4.0,
5
- "eval_steps": 1000,
6
- "global_step": 12,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
- {
12
- "epoch": 3.33,
13
- "grad_norm": 2.8058300018310547,
14
- "learning_rate": 3.3333333333333335e-05,
15
- "loss": 2.1093,
16
- "step": 10
17
- },
18
  {
19
  "epoch": 4.0,
20
- "step": 12,
21
  "total_flos": 7439897757745152.0,
22
- "train_loss": 2.0212895274162292,
23
- "train_runtime": 7.7329,
24
- "train_samples_per_second": 12.414,
25
- "train_steps_per_second": 1.552
26
  }
27
  ],
28
  "logging_steps": 10,
29
- "max_steps": 12,
30
  "num_input_tokens_seen": 0,
31
  "num_train_epochs": 4,
32
- "save_steps": 1000,
33
  "total_flos": 7439897757745152.0,
34
- "train_batch_size": 8,
35
  "trial_name": null,
36
  "trial_params": null
37
  }
 
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
  "epoch": 4.0,
5
+ "eval_steps": 100,
6
+ "global_step": 8,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
 
 
 
 
 
 
 
11
  {
12
  "epoch": 4.0,
13
+ "step": 8,
14
  "total_flos": 7439897757745152.0,
15
+ "train_loss": 1.4209961891174316,
16
+ "train_runtime": 7.3487,
17
+ "train_samples_per_second": 13.064,
18
+ "train_steps_per_second": 1.089
19
  }
20
  ],
21
  "logging_steps": 10,
22
+ "max_steps": 8,
23
  "num_input_tokens_seen": 0,
24
  "num_train_epochs": 4,
25
+ "save_steps": 100,
26
  "total_flos": 7439897757745152.0,
27
+ "train_batch_size": 16,
28
  "trial_name": null,
29
  "trial_params": null
30
  }