Training in progress, epoch 1, checkpoint
Browse files- checkpoint-107/config.json +69 -69
- checkpoint-107/model.safetensors +1 -1
- checkpoint-107/optimizer.pt +2 -2
- checkpoint-107/preprocessor_config.json +26 -47
- checkpoint-107/rng_state.pth +2 -2
- checkpoint-107/scheduler.pt +1 -1
- checkpoint-107/trainer_state.json +93 -93
- checkpoint-107/training_args.bin +2 -2
checkpoint-107/config.json
CHANGED
@@ -1,69 +1,69 @@
|
|
1 |
-
{
|
2 |
-
"_name_or_path": "microsoft/conditional-detr-resnet-50",
|
3 |
-
"activation_dropout": 0.0,
|
4 |
-
"activation_function": "relu",
|
5 |
-
"architectures": [
|
6 |
-
"ConditionalDetrForObjectDetection"
|
7 |
-
],
|
8 |
-
"attention_dropout": 0.0,
|
9 |
-
"auxiliary_loss": false,
|
10 |
-
"backbone": "resnet50",
|
11 |
-
"backbone_config": null,
|
12 |
-
"backbone_kwargs": {
|
13 |
-
"in_chans": 3,
|
14 |
-
"out_indices": [
|
15 |
-
1,
|
16 |
-
2,
|
17 |
-
3,
|
18 |
-
4
|
19 |
-
]
|
20 |
-
},
|
21 |
-
"bbox_cost": 5,
|
22 |
-
"bbox_loss_coefficient": 5,
|
23 |
-
"class_cost": 2,
|
24 |
-
"cls_loss_coefficient": 2,
|
25 |
-
"d_model": 256,
|
26 |
-
"decoder_attention_heads": 8,
|
27 |
-
"decoder_ffn_dim": 2048,
|
28 |
-
"decoder_layerdrop": 0.0,
|
29 |
-
"decoder_layers": 6,
|
30 |
-
"dice_loss_coefficient": 1,
|
31 |
-
"dilation": false,
|
32 |
-
"dropout": 0.1,
|
33 |
-
"encoder_attention_heads": 8,
|
34 |
-
"encoder_ffn_dim": 2048,
|
35 |
-
"encoder_layerdrop": 0.0,
|
36 |
-
"encoder_layers": 6,
|
37 |
-
"focal_alpha": 0.25,
|
38 |
-
"giou_cost": 2,
|
39 |
-
"giou_loss_coefficient": 2,
|
40 |
-
"id2label": {
|
41 |
-
"0": "Coverall",
|
42 |
-
"1": "Face_Shield",
|
43 |
-
"2": "Gloves",
|
44 |
-
"3": "Goggles",
|
45 |
-
"4": "Mask"
|
46 |
-
},
|
47 |
-
"init_std": 0.02,
|
48 |
-
"init_xavier_std": 1.0,
|
49 |
-
"is_encoder_decoder": true,
|
50 |
-
"label2id": {
|
51 |
-
"Coverall": 0,
|
52 |
-
"Face_Shield": 1,
|
53 |
-
"Gloves": 2,
|
54 |
-
"Goggles": 3,
|
55 |
-
"Mask": 4
|
56 |
-
},
|
57 |
-
"mask_loss_coefficient": 1,
|
58 |
-
"max_position_embeddings": 1024,
|
59 |
-
"model_type": "conditional_detr",
|
60 |
-
"num_channels": 3,
|
61 |
-
"num_hidden_layers": 6,
|
62 |
-
"num_queries": 300,
|
63 |
-
"position_embedding_type": "sine",
|
64 |
-
"scale_embedding": false,
|
65 |
-
"torch_dtype": "float32",
|
66 |
-
"transformers_version": "4.42.
|
67 |
-
"use_pretrained_backbone": true,
|
68 |
-
"use_timm_backbone": true
|
69 |
-
}
|
|
|
1 |
+
{
|
2 |
+
"_name_or_path": "microsoft/conditional-detr-resnet-50",
|
3 |
+
"activation_dropout": 0.0,
|
4 |
+
"activation_function": "relu",
|
5 |
+
"architectures": [
|
6 |
+
"ConditionalDetrForObjectDetection"
|
7 |
+
],
|
8 |
+
"attention_dropout": 0.0,
|
9 |
+
"auxiliary_loss": false,
|
10 |
+
"backbone": "resnet50",
|
11 |
+
"backbone_config": null,
|
12 |
+
"backbone_kwargs": {
|
13 |
+
"in_chans": 3,
|
14 |
+
"out_indices": [
|
15 |
+
1,
|
16 |
+
2,
|
17 |
+
3,
|
18 |
+
4
|
19 |
+
]
|
20 |
+
},
|
21 |
+
"bbox_cost": 5,
|
22 |
+
"bbox_loss_coefficient": 5,
|
23 |
+
"class_cost": 2,
|
24 |
+
"cls_loss_coefficient": 2,
|
25 |
+
"d_model": 256,
|
26 |
+
"decoder_attention_heads": 8,
|
27 |
+
"decoder_ffn_dim": 2048,
|
28 |
+
"decoder_layerdrop": 0.0,
|
29 |
+
"decoder_layers": 6,
|
30 |
+
"dice_loss_coefficient": 1,
|
31 |
+
"dilation": false,
|
32 |
+
"dropout": 0.1,
|
33 |
+
"encoder_attention_heads": 8,
|
34 |
+
"encoder_ffn_dim": 2048,
|
35 |
+
"encoder_layerdrop": 0.0,
|
36 |
+
"encoder_layers": 6,
|
37 |
+
"focal_alpha": 0.25,
|
38 |
+
"giou_cost": 2,
|
39 |
+
"giou_loss_coefficient": 2,
|
40 |
+
"id2label": {
|
41 |
+
"0": "Coverall",
|
42 |
+
"1": "Face_Shield",
|
43 |
+
"2": "Gloves",
|
44 |
+
"3": "Goggles",
|
45 |
+
"4": "Mask"
|
46 |
+
},
|
47 |
+
"init_std": 0.02,
|
48 |
+
"init_xavier_std": 1.0,
|
49 |
+
"is_encoder_decoder": true,
|
50 |
+
"label2id": {
|
51 |
+
"Coverall": 0,
|
52 |
+
"Face_Shield": 1,
|
53 |
+
"Gloves": 2,
|
54 |
+
"Goggles": 3,
|
55 |
+
"Mask": 4
|
56 |
+
},
|
57 |
+
"mask_loss_coefficient": 1,
|
58 |
+
"max_position_embeddings": 1024,
|
59 |
+
"model_type": "conditional_detr",
|
60 |
+
"num_channels": 3,
|
61 |
+
"num_hidden_layers": 6,
|
62 |
+
"num_queries": 300,
|
63 |
+
"position_embedding_type": "sine",
|
64 |
+
"scale_embedding": false,
|
65 |
+
"torch_dtype": "float32",
|
66 |
+
"transformers_version": "4.42.4",
|
67 |
+
"use_pretrained_backbone": true,
|
68 |
+
"use_timm_backbone": true
|
69 |
+
}
|
checkpoint-107/model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 174079796
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e0e73b52bd487fe68f9122ef8b954c6bc5b4e68351aaa78a20de44f8b42d1693
|
3 |
size 174079796
|
checkpoint-107/optimizer.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:93d99a373e4f0a6a9bdc55bb77fa36619ec34f8e95385249c63aedc7abc5e956
|
3 |
+
size 345697817
|
checkpoint-107/preprocessor_config.json
CHANGED
@@ -1,47 +1,26 @@
|
|
1 |
-
{
|
2 |
-
"
|
3 |
-
|
4 |
-
|
5 |
-
|
6 |
-
|
7 |
-
|
8 |
-
|
9 |
-
|
10 |
-
|
11 |
-
|
12 |
-
|
13 |
-
|
14 |
-
|
15 |
-
|
16 |
-
|
17 |
-
|
18 |
-
|
19 |
-
|
20 |
-
|
21 |
-
|
22 |
-
|
23 |
-
|
24 |
-
|
25 |
-
|
26 |
-
|
27 |
-
"do_resize": false,
|
28 |
-
"format": "coco_detection",
|
29 |
-
"image_mean": [
|
30 |
-
0.485,
|
31 |
-
0.456,
|
32 |
-
0.406
|
33 |
-
],
|
34 |
-
"image_processor_type": "ConditionalDetrImageProcessor",
|
35 |
-
"image_std": [
|
36 |
-
0.229,
|
37 |
-
0.224,
|
38 |
-
0.225
|
39 |
-
],
|
40 |
-
"pad_size": null,
|
41 |
-
"resample": 2,
|
42 |
-
"rescale_factor": 0.00392156862745098,
|
43 |
-
"size": {
|
44 |
-
"longest_edge": 1333,
|
45 |
-
"shortest_edge": 800
|
46 |
-
}
|
47 |
-
}
|
|
|
1 |
+
{
|
2 |
+
"do_convert_annotations": true,
|
3 |
+
"do_normalize": true,
|
4 |
+
"do_pad": false,
|
5 |
+
"do_rescale": true,
|
6 |
+
"do_resize": false,
|
7 |
+
"format": "coco_detection",
|
8 |
+
"image_mean": [
|
9 |
+
0.485,
|
10 |
+
0.456,
|
11 |
+
0.406
|
12 |
+
],
|
13 |
+
"image_processor_type": "ConditionalDetrImageProcessor",
|
14 |
+
"image_std": [
|
15 |
+
0.229,
|
16 |
+
0.224,
|
17 |
+
0.225
|
18 |
+
],
|
19 |
+
"pad_size": null,
|
20 |
+
"resample": 2,
|
21 |
+
"rescale_factor": 0.00392156862745098,
|
22 |
+
"size": {
|
23 |
+
"longest_edge": 1333,
|
24 |
+
"shortest_edge": 800
|
25 |
+
}
|
26 |
+
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
checkpoint-107/rng_state.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c96e01c4478ce452b19c3ac871fcae8ffc9ff5adff345b47347e9222ef89609e
|
3 |
+
size 14244
|
checkpoint-107/scheduler.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1064
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8c71b99b3bd76330e6a5aae2cdf3df1f34ce8d9f90031a6793ce1e0abac2e6f7
|
3 |
size 1064
|
checkpoint-107/trainer_state.json
CHANGED
@@ -1,93 +1,93 @@
|
|
1 |
-
{
|
2 |
-
"best_metric": 0.
|
3 |
-
"best_model_checkpoint": "test_detr_finetuned_cppe5
|
4 |
-
"epoch": 1.0,
|
5 |
-
"eval_steps": 500,
|
6 |
-
"global_step": 107,
|
7 |
-
"is_hyper_param_search": false,
|
8 |
-
"is_local_process_zero": true,
|
9 |
-
"is_world_process_zero": true,
|
10 |
-
"log_history": [
|
11 |
-
{
|
12 |
-
"epoch": 1.0,
|
13 |
-
"step": 107,
|
14 |
-
"train_loss":
|
15 |
-
"train_map": 0.
|
16 |
-
"train_map_50": 0.
|
17 |
-
"train_map_75": 0.
|
18 |
-
"train_map_Coverall": 0.
|
19 |
-
"train_map_Face_Shield": 0.
|
20 |
-
"train_map_Gloves": 0.
|
21 |
-
"train_map_Goggles": 0.0,
|
22 |
-
"train_map_Mask": 0.
|
23 |
-
"train_map_large": 0.
|
24 |
-
"train_map_medium": 0.
|
25 |
-
"train_map_small": 0.
|
26 |
-
"train_mar_1": 0.
|
27 |
-
"train_mar_10": 0.
|
28 |
-
"train_mar_100": 0.
|
29 |
-
"train_mar_100_Coverall": 0.
|
30 |
-
"train_mar_100_Face_Shield": 0.
|
31 |
-
"train_mar_100_Gloves": 0.
|
32 |
-
"train_mar_100_Goggles": 0.
|
33 |
-
"train_mar_100_Mask": 0.
|
34 |
-
"train_mar_large": 0.
|
35 |
-
"train_mar_medium": 0.
|
36 |
-
"train_mar_small": 0.
|
37 |
-
"train_runtime":
|
38 |
-
"train_samples_per_second":
|
39 |
-
"train_steps_per_second":
|
40 |
-
},
|
41 |
-
{
|
42 |
-
"epoch": 1.0,
|
43 |
-
"eval_loss":
|
44 |
-
"eval_map": 0.
|
45 |
-
"eval_map_50": 0.
|
46 |
-
"eval_map_75": 0.
|
47 |
-
"eval_map_Coverall": 0.
|
48 |
-
"eval_map_Face_Shield": 0.
|
49 |
-
"eval_map_Gloves": 0.
|
50 |
-
"eval_map_Goggles": 0.
|
51 |
-
"eval_map_Mask": 0.
|
52 |
-
"eval_map_large": 0.
|
53 |
-
"eval_map_medium": 0.
|
54 |
-
"eval_map_small": 0.
|
55 |
-
"eval_mar_1": 0.
|
56 |
-
"eval_mar_10": 0.
|
57 |
-
"eval_mar_100": 0.
|
58 |
-
"eval_mar_100_Coverall": 0.
|
59 |
-
"eval_mar_100_Face_Shield": 0.
|
60 |
-
"eval_mar_100_Gloves": 0.
|
61 |
-
"eval_mar_100_Goggles": 0.
|
62 |
-
"eval_mar_100_Mask": 0.
|
63 |
-
"eval_mar_large": 0.
|
64 |
-
"eval_mar_medium": 0.
|
65 |
-
"eval_mar_small": 0.
|
66 |
-
"eval_runtime":
|
67 |
-
"eval_samples_per_second":
|
68 |
-
"eval_steps_per_second":
|
69 |
-
"step": 107
|
70 |
-
}
|
71 |
-
],
|
72 |
-
"logging_steps": 500,
|
73 |
-
"max_steps": 10700,
|
74 |
-
"num_input_tokens_seen": 0,
|
75 |
-
"num_train_epochs": 100,
|
76 |
-
"save_steps": 500,
|
77 |
-
"stateful_callbacks": {
|
78 |
-
"TrainerControl": {
|
79 |
-
"args": {
|
80 |
-
"should_epoch_stop": false,
|
81 |
-
"should_evaluate": false,
|
82 |
-
"should_log": false,
|
83 |
-
"should_save": true,
|
84 |
-
"should_training_stop": false
|
85 |
-
},
|
86 |
-
"attributes": {}
|
87 |
-
}
|
88 |
-
},
|
89 |
-
"total_flos": 1.5270643231488e+17,
|
90 |
-
"train_batch_size": 8,
|
91 |
-
"trial_name": null,
|
92 |
-
"trial_params": null
|
93 |
-
}
|
|
|
1 |
+
{
|
2 |
+
"best_metric": 0.0229,
|
3 |
+
"best_model_checkpoint": "test_detr_finetuned_cppe5\\checkpoint-107",
|
4 |
+
"epoch": 1.0,
|
5 |
+
"eval_steps": 500,
|
6 |
+
"global_step": 107,
|
7 |
+
"is_hyper_param_search": false,
|
8 |
+
"is_local_process_zero": true,
|
9 |
+
"is_world_process_zero": true,
|
10 |
+
"log_history": [
|
11 |
+
{
|
12 |
+
"epoch": 1.0,
|
13 |
+
"step": 107,
|
14 |
+
"train_loss": 2.4489498138427734,
|
15 |
+
"train_map": 0.0345,
|
16 |
+
"train_map_50": 0.0655,
|
17 |
+
"train_map_75": 0.0342,
|
18 |
+
"train_map_Coverall": 0.1469,
|
19 |
+
"train_map_Face_Shield": 0.0001,
|
20 |
+
"train_map_Gloves": 0.0053,
|
21 |
+
"train_map_Goggles": 0.0,
|
22 |
+
"train_map_Mask": 0.0204,
|
23 |
+
"train_map_large": 0.0326,
|
24 |
+
"train_map_medium": 0.0085,
|
25 |
+
"train_map_small": 0.0026,
|
26 |
+
"train_mar_1": 0.0855,
|
27 |
+
"train_mar_10": 0.1663,
|
28 |
+
"train_mar_100": 0.2076,
|
29 |
+
"train_mar_100_Coverall": 0.5511,
|
30 |
+
"train_mar_100_Face_Shield": 0.0052,
|
31 |
+
"train_mar_100_Gloves": 0.2184,
|
32 |
+
"train_mar_100_Goggles": 0.0097,
|
33 |
+
"train_mar_100_Mask": 0.2535,
|
34 |
+
"train_mar_large": 0.3274,
|
35 |
+
"train_mar_medium": 0.1339,
|
36 |
+
"train_mar_small": 0.0219,
|
37 |
+
"train_runtime": 29.1905,
|
38 |
+
"train_samples_per_second": 29.119,
|
39 |
+
"train_steps_per_second": 3.666
|
40 |
+
},
|
41 |
+
{
|
42 |
+
"epoch": 1.0,
|
43 |
+
"eval_loss": 2.5123209953308105,
|
44 |
+
"eval_map": 0.0229,
|
45 |
+
"eval_map_50": 0.0502,
|
46 |
+
"eval_map_75": 0.0195,
|
47 |
+
"eval_map_Coverall": 0.0993,
|
48 |
+
"eval_map_Face_Shield": 0.0003,
|
49 |
+
"eval_map_Gloves": 0.0038,
|
50 |
+
"eval_map_Goggles": 0.0002,
|
51 |
+
"eval_map_Mask": 0.0109,
|
52 |
+
"eval_map_large": 0.0247,
|
53 |
+
"eval_map_medium": 0.0069,
|
54 |
+
"eval_map_small": 0.0024,
|
55 |
+
"eval_mar_1": 0.061,
|
56 |
+
"eval_mar_10": 0.1307,
|
57 |
+
"eval_mar_100": 0.1723,
|
58 |
+
"eval_mar_100_Coverall": 0.4779,
|
59 |
+
"eval_mar_100_Face_Shield": 0.0152,
|
60 |
+
"eval_mar_100_Gloves": 0.1562,
|
61 |
+
"eval_mar_100_Goggles": 0.0185,
|
62 |
+
"eval_mar_100_Mask": 0.1938,
|
63 |
+
"eval_mar_large": 0.3415,
|
64 |
+
"eval_mar_medium": 0.1271,
|
65 |
+
"eval_mar_small": 0.0166,
|
66 |
+
"eval_runtime": 11.5313,
|
67 |
+
"eval_samples_per_second": 13.008,
|
68 |
+
"eval_steps_per_second": 1.648,
|
69 |
+
"step": 107
|
70 |
+
}
|
71 |
+
],
|
72 |
+
"logging_steps": 500,
|
73 |
+
"max_steps": 10700,
|
74 |
+
"num_input_tokens_seen": 0,
|
75 |
+
"num_train_epochs": 100,
|
76 |
+
"save_steps": 500,
|
77 |
+
"stateful_callbacks": {
|
78 |
+
"TrainerControl": {
|
79 |
+
"args": {
|
80 |
+
"should_epoch_stop": false,
|
81 |
+
"should_evaluate": false,
|
82 |
+
"should_log": false,
|
83 |
+
"should_save": true,
|
84 |
+
"should_training_stop": false
|
85 |
+
},
|
86 |
+
"attributes": {}
|
87 |
+
}
|
88 |
+
},
|
89 |
+
"total_flos": 1.5270643231488e+17,
|
90 |
+
"train_batch_size": 8,
|
91 |
+
"trial_name": null,
|
92 |
+
"trial_params": null
|
93 |
+
}
|
checkpoint-107/training_args.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0fec926f50e96773b99e04d57819f5ac08d83a45048d26a31f3b9c2098e2492b
|
3 |
+
size 5112
|