matnun committed on
Commit
66c7f5e
·
1 Parent(s): 3b081c6

Upload 3 files

Browse files
Files changed (3) hide show
  1. README.md +66 -0
  2. config.json +144 -0
  3. training_args.bin +3 -0
README.md ADDED
@@ -0,0 +1,66 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ license: other
3
+ tags:
4
+ - vision
5
+ - image-segmentation
6
+ - generated_from_trainer
7
+ model-index:
8
+ - name: segformer-b0-finetuned-segments-sidewalk-2
9
+ results: []
10
+ ---
11
+
12
+ <!-- This model card has been generated automatically according to the information the Trainer had access to. You
13
+ should probably proofread and complete it, then remove this comment. -->
14
+
15
+ # segformer-b0-finetuned-segments-sidewalk-2
16
+
17
+ This model is a fine-tuned version of [nvidia/mit-b0](https://huggingface.co/nvidia/mit-b0) on the segments/sidewalk-semantic dataset.
18
+ It achieves the following results on the evaluation set:
19
+ - Loss: 1.9042
20
+ - Mean IoU: 0.1600
21
+ - Mean Accuracy: 0.1997
22
+ - Overall Accuracy: 0.7338
23
+ - Per Category IoU: [nan, 0.27359520957005035, 0.6563592089876799, 0.0, 0.23344374046535918, 0.0, nan, 0.0, 0.0, 0.0, 0.5539341917024321, nan, nan, nan, nan, 0.0, 0.0, nan, 0.6213519498256361, 0.0, 0.0, 0.0, nan, nan, 0.0, 0.0, 0.0, 0.0, 0.8012808797206368, 0.0, 0.8609473035107046, nan, 0.0, 0.0, 0.0]
24
+ - Per Category Accuracy: [nan, 0.38598740280061317, 0.9344800917343116, 0.0, 0.23402267811135147, 0.0, nan, 0.0, 0.0, 0.0, 0.6574569071869553, nan, nan, nan, nan, 0.0, 0.0, nan, 0.889953470705536, 0.0, 0.0, 0.0, nan, nan, 0.0, 0.0, 0.0, 0.0, 0.9339123774958169, 0.0, 0.9562267789312698, nan, 0.0, 0.0, 0.0]
25
+
26
+ ## Model description
27
+
28
+ More information needed
29
+
30
+ ## Intended uses & limitations
31
+
32
+ More information needed
33
+
34
+ ## Training and evaluation data
35
+
36
+ More information needed
37
+
38
+ ## Training procedure
39
+
40
+ ### Training hyperparameters
41
+
42
+ The following hyperparameters were used during training:
43
+ - learning_rate: 6e-05
44
+ - train_batch_size: 2
45
+ - eval_batch_size: 2
46
+ - seed: 42
47
+ - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
48
+ - lr_scheduler_type: linear
49
+ - num_epochs: 2
50
+
51
+ ### Training results
52
+
53
+ | Training Loss | Epoch | Step | Validation Loss | Mean IoU | Mean Accuracy | Overall Accuracy | Per Category IoU | Per Category Accuracy |
54
+ |:-------------:|:-----:|:----:|:---------------:|:--------:|:-------------:|:----------------:|:----------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------:|:---------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------:|
55
+ | 2.8419 | 0.42 | 20 | 3.2243 | 0.1239 | 0.1973 | 0.6992 | [0.0, 0.221283072298205, 0.6482498250140304, 0.0, 0.36607695456244177, 0.013827775204570018, nan, 1.0254201659129828e-05, 0.0, 0.0, 0.5416500682753081, nan, 0.0, 0.0, nan, 0.0, 0.0, 0.0, 0.5339731316050166, 0.0, 0.0006440571922786744, 0.0, nan, 0.0, 0.0, 0.0, 0.0, 0.0, 0.7498440701547007, 0.0, 0.7659222854515146, 0.0, 0.0, 0.0, 0.0] | [nan, 0.3346613609105567, 0.8582083544770268, 0.0, 0.5101472837243907, 0.015482685970504024, nan, 1.0366454154356502e-05, 0.0, 0.0, 0.6745826026281508, nan, nan, nan, nan, 0.0, 0.0, nan, 0.8093545247364923, 0.0, 0.0006458279514337381, 0.0, nan, nan, 0.0, 0.0, 0.0, 0.0, 0.9324806212895075, 0.0, 0.797418357423677, nan, 0.0, 0.0, 0.0] |
56
+ | 2.3662 | 0.83 | 40 | 2.5147 | 0.1402 | 0.1798 | 0.6989 | [nan, 0.19549119549985344, 0.6036027201962391, 0.0, 0.0019222772099991463, 0.000300503343099692, nan, 0.0, 0.0, 0.0, 0.47853978429259575, nan, nan, nan, nan, 0.0, 0.0, nan, 0.5820555774612892, 0.0, 0.0, 0.0, nan, nan, 0.0, 0.0, 0.0, 0.0, 0.7898452112422248, 0.0, 0.8521568687502872, nan, 0.0, 0.0, 0.0] | [nan, 0.25107981668136076, 0.9396577375184628, 0.0, 0.0019233683746435017, 0.0003025228242666523, nan, 0.0, 0.0, 0.0, 0.5513810659584686, nan, nan, nan, nan, 0.0, 0.0, nan, 0.8953553793561865, 0.0, 0.0, 0.0, nan, nan, 0.0, 0.0, 0.0, 0.0, 0.9300976130892274, 0.0, 0.9250758451014455, nan, 0.0, 0.0, 0.0] |
57
+ | 2.1745 | 1.25 | 60 | 2.0428 | 0.1485 | 0.1882 | 0.7162 | [nan, 0.24240648716131, 0.6262941164542789, 0.0, 0.04440846090507781, 0.0, nan, 0.0, 0.0, 0.0, 0.522913696330921, nan, nan, nan, nan, 0.0, 0.0, nan, 0.6194890050543631, 0.0, 0.0, 0.0, nan, nan, 0.0, 0.0, 0.0, 0.0, 0.7947837731119848, 0.0, 0.8609570537373858, nan, 0.0, 0.0, 0.0] | [nan, 0.3318909301752965, 0.9392945927202885, 0.0, 0.04443587164684973, 0.0, nan, 0.0, 0.0, 0.0, 0.6149676720993105, nan, nan, nan, nan, 0.0, 0.0, nan, 0.8836542113759377, 0.0, 0.0, 0.0, nan, nan, 0.0, 0.0, 0.0, 0.0, 0.9409947331534898, 0.0, 0.9509521157666382, nan, 0.0, 0.0, 0.0] |
58
+ | 1.986 | 1.67 | 80 | 1.9042 | 0.1600 | 0.1997 | 0.7338 | [nan, 0.27359520957005035, 0.6563592089876799, 0.0, 0.23344374046535918, 0.0, nan, 0.0, 0.0, 0.0, 0.5539341917024321, nan, nan, nan, nan, 0.0, 0.0, nan, 0.6213519498256361, 0.0, 0.0, 0.0, nan, nan, 0.0, 0.0, 0.0, 0.0, 0.8012808797206368, 0.0, 0.8609473035107046, nan, 0.0, 0.0, 0.0] | [nan, 0.38598740280061317, 0.9344800917343116, 0.0, 0.23402267811135147, 0.0, nan, 0.0, 0.0, 0.0, 0.6574569071869553, nan, nan, nan, nan, 0.0, 0.0, nan, 0.889953470705536, 0.0, 0.0, 0.0, nan, nan, 0.0, 0.0, 0.0, 0.0, 0.9339123774958169, 0.0, 0.9562267789312698, nan, 0.0, 0.0, 0.0] |
59
+
60
+
61
+ ### Framework versions
62
+
63
+ - Transformers 4.23.1
64
+ - Pytorch 1.12.1+cu113
65
+ - Datasets 2.5.2
66
+ - Tokenizers 0.13.1
config.json ADDED
@@ -0,0 +1,144 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "nvidia/mit-b0",
3
+ "architectures": [
4
+ "SegformerForSemanticSegmentation"
5
+ ],
6
+ "attention_probs_dropout_prob": 0.0,
7
+ "classifier_dropout_prob": 0.1,
8
+ "decoder_hidden_size": 256,
9
+ "depths": [
10
+ 2,
11
+ 2,
12
+ 2,
13
+ 2
14
+ ],
15
+ "downsampling_rates": [
16
+ 1,
17
+ 4,
18
+ 8,
19
+ 16
20
+ ],
21
+ "drop_path_rate": 0.1,
22
+ "hidden_act": "gelu",
23
+ "hidden_dropout_prob": 0.0,
24
+ "hidden_sizes": [
25
+ 32,
26
+ 64,
27
+ 160,
28
+ 256
29
+ ],
30
+ "id2label": {
31
+ "0": "unlabeled",
32
+ "1": "flat-road",
33
+ "2": "flat-sidewalk",
34
+ "3": "flat-crosswalk",
35
+ "4": "flat-cyclinglane",
36
+ "5": "flat-parkingdriveway",
37
+ "6": "flat-railtrack",
38
+ "7": "flat-curb",
39
+ "8": "human-person",
40
+ "9": "human-rider",
41
+ "10": "vehicle-car",
42
+ "11": "vehicle-truck",
43
+ "12": "vehicle-bus",
44
+ "13": "vehicle-tramtrain",
45
+ "14": "vehicle-motorcycle",
46
+ "15": "vehicle-bicycle",
47
+ "16": "vehicle-caravan",
48
+ "17": "vehicle-cartrailer",
49
+ "18": "construction-building",
50
+ "19": "construction-door",
51
+ "20": "construction-wall",
52
+ "21": "construction-fenceguardrail",
53
+ "22": "construction-bridge",
54
+ "23": "construction-tunnel",
55
+ "24": "construction-stairs",
56
+ "25": "object-pole",
57
+ "26": "object-trafficsign",
58
+ "27": "object-trafficlight",
59
+ "28": "nature-vegetation",
60
+ "29": "nature-terrain",
61
+ "30": "sky",
62
+ "31": "void-ground",
63
+ "32": "void-dynamic",
64
+ "33": "void-static",
65
+ "34": "void-unclear"
66
+ },
67
+ "image_size": 224,
68
+ "initializer_range": 0.02,
69
+ "label2id": {
70
+ "construction-bridge": 22,
71
+ "construction-building": 18,
72
+ "construction-door": 19,
73
+ "construction-fenceguardrail": 21,
74
+ "construction-stairs": 24,
75
+ "construction-tunnel": 23,
76
+ "construction-wall": 20,
77
+ "flat-crosswalk": 3,
78
+ "flat-curb": 7,
79
+ "flat-cyclinglane": 4,
80
+ "flat-parkingdriveway": 5,
81
+ "flat-railtrack": 6,
82
+ "flat-road": 1,
83
+ "flat-sidewalk": 2,
84
+ "human-person": 8,
85
+ "human-rider": 9,
86
+ "nature-terrain": 29,
87
+ "nature-vegetation": 28,
88
+ "object-pole": 25,
89
+ "object-trafficlight": 27,
90
+ "object-trafficsign": 26,
91
+ "sky": 30,
92
+ "unlabeled": 0,
93
+ "vehicle-bicycle": 15,
94
+ "vehicle-bus": 12,
95
+ "vehicle-car": 10,
96
+ "vehicle-caravan": 16,
97
+ "vehicle-cartrailer": 17,
98
+ "vehicle-motorcycle": 14,
99
+ "vehicle-tramtrain": 13,
100
+ "vehicle-truck": 11,
101
+ "void-dynamic": 32,
102
+ "void-ground": 31,
103
+ "void-static": 33,
104
+ "void-unclear": 34
105
+ },
106
+ "layer_norm_eps": 1e-06,
107
+ "mlp_ratios": [
108
+ 4,
109
+ 4,
110
+ 4,
111
+ 4
112
+ ],
113
+ "model_type": "segformer",
114
+ "num_attention_heads": [
115
+ 1,
116
+ 2,
117
+ 5,
118
+ 8
119
+ ],
120
+ "num_channels": 3,
121
+ "num_encoder_blocks": 4,
122
+ "patch_sizes": [
123
+ 7,
124
+ 3,
125
+ 3,
126
+ 3
127
+ ],
128
+ "reshape_last_stage": true,
129
+ "semantic_loss_ignore_index": 255,
130
+ "sr_ratios": [
131
+ 8,
132
+ 4,
133
+ 2,
134
+ 1
135
+ ],
136
+ "strides": [
137
+ 4,
138
+ 2,
139
+ 2,
140
+ 2
141
+ ],
142
+ "torch_dtype": "float32",
143
+ "transformers_version": "4.23.1"
144
+ }
training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3bee57adcaeb94b6abdb3dcdcb8641f9ccb208c2253aff1a9b0be802d59da305
3
+ size 3439