johanhag commited on
Commit
1c93e00
1 Parent(s): 2887686

End of training

Browse files
Files changed (4) hide show
  1. README.md +80 -0
  2. config.json +88 -0
  3. model.safetensors +3 -0
  4. training_args.bin +3 -0
README.md ADDED
@@ -0,0 +1,80 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ license: other
3
+ base_model: nvidia/mit-b0
4
+ tags:
5
+ - vision
6
+ - image-segmentation
7
+ - generated_from_trainer
8
+ model-index:
9
+ - name: segformer-b0-winter_2
10
+ results: []
11
+ ---
12
+
13
+ <!-- This model card has been generated automatically according to the information the Trainer had access to. You
14
+ should probably proofread and complete it, then remove this comment. -->
15
+
16
+ # segformer-b0-winter_2
17
+
18
+ This model is a fine-tuned version of [nvidia/mit-b0](https://huggingface.co/nvidia/mit-b0) on the johanhag/winter dataset.
19
+ It achieves the following results on the evaluation set:
20
+ - Loss: 1.0535
21
+ - Mean Iou: 0.3344
22
+ - Mean Accuracy: 0.4082
23
+ - Overall Accuracy: 0.8584
24
+ - Accuracy Unlabeled: nan
25
+ - Accuracy Road: 0.5791
26
+ - Accuracy Side walk: 0.1367
27
+ - Accuracy Car: 0.7716
28
+ - Accuracy Pedestrian: 0.0
29
+ - Accuracy Sign: 0.0
30
+ - Accuracy Other: 0.9616
31
+ - Iou Unlabeled: nan
32
+ - Iou Road: 0.4852
33
+ - Iou Side walk: 0.1124
34
+ - Iou Car: 0.5493
35
+ - Iou Pedestrian: 0.0
36
+ - Iou Sign: 0.0
37
+ - Iou Other: 0.8593
38
+
39
+ ## Model description
40
+
41
+ More information needed
42
+
43
+ ## Intended uses & limitations
44
+
45
+ More information needed
46
+
47
+ ## Training and evaluation data
48
+
49
+ More information needed
50
+
51
+ ## Training procedure
52
+
53
+ ### Training hyperparameters
54
+
55
+ The following hyperparameters were used during training:
56
+ - learning_rate: 6e-05
57
+ - train_batch_size: 2
58
+ - eval_batch_size: 2
59
+ - seed: 42
60
+ - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
61
+ - lr_scheduler_type: linear
62
+ - num_epochs: 2
63
+
64
+ ### Training results
65
+
66
+ | Training Loss | Epoch | Step | Validation Loss | Mean Iou | Mean Accuracy | Overall Accuracy | Accuracy Unlabeled | Accuracy Road | Accuracy Side walk | Accuracy Car | Accuracy Pedestrian | Accuracy Sign | Accuracy Other | Iou Unlabeled | Iou Road | Iou Side walk | Iou Car | Iou Pedestrian | Iou Sign | Iou Other |
67
+ |:-------------:|:-----:|:----:|:---------------:|:--------:|:-------------:|:----------------:|:------------------:|:-------------:|:------------------:|:------------:|:-------------------:|:-------------:|:--------------:|:-------------:|:--------:|:-------------:|:-------:|:--------------:|:--------:|:---------:|
68
+ | 1.5205 | 0.37 | 20 | 1.7165 | 0.2199 | 0.4062 | 0.7410 | nan | 0.6131 | 0.0612 | 0.8217 | 0.0191 | 0.1249 | 0.7972 | 0.0 | 0.4142 | 0.0255 | 0.3422 | 0.0160 | 0.0075 | 0.7342 |
69
+ | 1.206 | 0.74 | 40 | 1.3022 | 0.2637 | 0.3793 | 0.8243 | nan | 0.6081 | 0.1049 | 0.6391 | 0.0083 | 0.0 | 0.9156 | 0.0 | 0.4387 | 0.0670 | 0.5111 | 0.0083 | 0.0 | 0.8211 |
70
+ | 0.9859 | 1.11 | 60 | 1.1535 | 0.2756 | 0.4094 | 0.8356 | nan | 0.6077 | 0.2204 | 0.7029 | 0.0 | 0.0 | 0.9254 | 0.0 | 0.4650 | 0.1159 | 0.5125 | 0.0 | 0.0 | 0.8359 |
71
+ | 0.9968 | 1.48 | 80 | 1.0899 | 0.3171 | 0.3962 | 0.8452 | nan | 0.5982 | 0.0850 | 0.7523 | 0.0 | 0.0 | 0.9416 | nan | 0.4673 | 0.0643 | 0.5239 | 0.0 | 0.0 | 0.8468 |
72
+ | 0.92 | 1.85 | 100 | 1.0535 | 0.3344 | 0.4082 | 0.8584 | nan | 0.5791 | 0.1367 | 0.7716 | 0.0 | 0.0 | 0.9616 | nan | 0.4852 | 0.1124 | 0.5493 | 0.0 | 0.0 | 0.8593 |
73
+
74
+
75
+ ### Framework versions
76
+
77
+ - Transformers 4.36.2
78
+ - Pytorch 2.1.2+cu121
79
+ - Datasets 2.16.1
80
+ - Tokenizers 0.15.0
config.json ADDED
@@ -0,0 +1,88 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "nvidia/mit-b0",
3
+ "architectures": [
4
+ "SegformerForSemanticSegmentation"
5
+ ],
6
+ "attention_probs_dropout_prob": 0.0,
7
+ "classifier_dropout_prob": 0.1,
8
+ "decoder_hidden_size": 256,
9
+ "depths": [
10
+ 2,
11
+ 2,
12
+ 2,
13
+ 2
14
+ ],
15
+ "downsampling_rates": [
16
+ 1,
17
+ 4,
18
+ 8,
19
+ 16
20
+ ],
21
+ "drop_path_rate": 0.1,
22
+ "hidden_act": "gelu",
23
+ "hidden_dropout_prob": 0.0,
24
+ "hidden_sizes": [
25
+ 32,
26
+ 64,
27
+ 160,
28
+ 256
29
+ ],
30
+ "id2label": {
31
+ "0": "unlabeled",
32
+ "1": "road",
33
+ "2": "side walk",
34
+ "3": "car",
35
+ "4": "pedestrian",
36
+ "5": "sign",
37
+ "6": "other"
38
+ },
39
+ "image_size": 224,
40
+ "initializer_range": 0.02,
41
+ "label2id": {
42
+ "car": 3,
43
+ "other": 6,
44
+ "pedestrian": 4,
45
+ "road": 1,
46
+ "side walk": 2,
47
+ "sign": 5,
48
+ "unlabeled": 0
49
+ },
50
+ "layer_norm_eps": 1e-06,
51
+ "mlp_ratios": [
52
+ 4,
53
+ 4,
54
+ 4,
55
+ 4
56
+ ],
57
+ "model_type": "segformer",
58
+ "num_attention_heads": [
59
+ 1,
60
+ 2,
61
+ 5,
62
+ 8
63
+ ],
64
+ "num_channels": 3,
65
+ "num_encoder_blocks": 4,
66
+ "patch_sizes": [
67
+ 7,
68
+ 3,
69
+ 3,
70
+ 3
71
+ ],
72
+ "reshape_last_stage": true,
73
+ "semantic_loss_ignore_index": 255,
74
+ "sr_ratios": [
75
+ 8,
76
+ 4,
77
+ 2,
78
+ 1
79
+ ],
80
+ "strides": [
81
+ 4,
82
+ 2,
83
+ 2,
84
+ 2
85
+ ],
86
+ "torch_dtype": "float32",
87
+ "transformers_version": "4.36.2"
88
+ }
model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:05a5faa7c61425e636a4e151c2a842e8556cbcec35766f9d71d5c6d07becdf09
3
+ size 14889924
training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d9acacd0b4f9409b5f9e34b8f6fb755bfd13fed64ffd4d48d229a17a68f88e16
3
+ size 4728