ramdrop committed on
Commit
a7d69eb
1 Parent(s): 32c539a

add weights

Browse files
datt_eurosat/wandb/latest-run/files/config.yaml ADDED
@@ -0,0 +1,262 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ wandb_version: 1
2
+
3
+ CONFIG:
4
+ desc: null
5
+ value: datt_mix_ctrs.yaml
6
+ MODEL:
7
+ desc: null
8
+ value:
9
+ TYPE: dat
10
+ NAME: dat_plus_plus
11
+ PRETRAINED: pretrained_weights/dat_pp_tiny_in1k_224.pth
12
+ DAT:
13
+ img_size: 224
14
+ patch_size: 4
15
+ num_classes: 1000
16
+ expansion: 4
17
+ dim_stem: 64
18
+ dims:
19
+ - 64
20
+ - 128
21
+ - 256
22
+ - 512
23
+ depths:
24
+ - 2
25
+ - 4
26
+ - 18
27
+ - 2
28
+ stage_spec:
29
+ - - N
30
+ - D
31
+ - - N
32
+ - D
33
+ - N
34
+ - D
35
+ - - N
36
+ - D
37
+ - N
38
+ - D
39
+ - N
40
+ - D
41
+ - N
42
+ - D
43
+ - N
44
+ - D
45
+ - N
46
+ - D
47
+ - N
48
+ - D
49
+ - N
50
+ - D
51
+ - N
52
+ - D
53
+ - - D
54
+ - D
55
+ heads:
56
+ - 2
57
+ - 4
58
+ - 8
59
+ - 16
60
+ window_sizes:
61
+ - 7
62
+ - 7
63
+ - 7
64
+ - 7
65
+ groups:
66
+ - 1
67
+ - 2
68
+ - 4
69
+ - 8
70
+ use_pes:
71
+ - true
72
+ - true
73
+ - true
74
+ - true
75
+ dwc_pes:
76
+ - false
77
+ - false
78
+ - false
79
+ - false
80
+ strides:
81
+ - 8
82
+ - 4
83
+ - 2
84
+ - 1
85
+ offset_range_factor:
86
+ - -1
87
+ - -1
88
+ - -1
89
+ - -1
90
+ no_offs:
91
+ - false
92
+ - false
93
+ - false
94
+ - false
95
+ fixed_pes:
96
+ - false
97
+ - false
98
+ - false
99
+ - false
100
+ use_dwc_mlps:
101
+ - true
102
+ - true
103
+ - true
104
+ - true
105
+ use_lpus:
106
+ - true
107
+ - true
108
+ - true
109
+ - true
110
+ use_conv_patches: true
111
+ ksizes:
112
+ - 9
113
+ - 7
114
+ - 5
115
+ - 3
116
+ nat_ksizes:
117
+ - 7
118
+ - 7
119
+ - 7
120
+ - 7
121
+ drop_rate: 0.0
122
+ attn_drop_rate: 0.0
123
+ drop_path_rate: 0.2
124
+ clip_dim: 1024
125
+ quantization:
126
+ method: jacob
127
+ weight:
128
+ num_bits: 8
129
+ axis: per_channel
130
+ calib_method: max
131
+ activation:
132
+ num_bits: 8
133
+ axis: per_tensor
134
+ calib_method: max
135
+ calibration:
136
+ num_batch: 2
137
+ modal: rgbd
138
+ TRAIN:
139
+ desc: null
140
+ value:
141
+ EPOCHS: 120
142
+ WARMUP_EPOCHS: 0
143
+ BASE_LR: 1.0e-06
144
+ WEIGHT_DECAY: 0.05
145
+ WARMUP_LR: 5.0e-07
146
+ MIN_LR: 5.0e-07
147
+ CLIP_GRAD: 5.0
148
+ LR_SCHEDULER:
149
+ NAME: cosine
150
+ DECAY_EPOCHS: 30
151
+ DECAY_RATE: 0.1
152
+ OPTIMIZER:
153
+ NAME: adamw
154
+ EPS: 1.0e-08
155
+ BETAS:
156
+ - 0.9
157
+ - 0.999
158
+ MOMENTUM: 0.9
159
+ CRETERION:
160
+ NAME: TripletMarginLoss
161
+ TRIPLET_MARGIN: 0.3
162
+ MINING_METHOD:
163
+ POSITIVE: easy
164
+ NEGATIVE: random
165
+ TOTAL: semihard
166
+ NEG_NUM: 3
167
+ KD:
168
+ ENABLE: false
169
+ WEIGHT: 10
170
+ WEIGHT: 0.05
171
+ DATA:
172
+ desc: null
173
+ value:
174
+ DATASET: eurosat
175
+ ROOT: dbs
176
+ BATCH_SIZE: 4
177
+ VAL_BATCH_SIZE: 32
178
+ EMBEDDING_BATCH_SIZE: 32
179
+ DEPTH_TRANSFORM: rgb
180
+ IS_SUBSET: true
181
+ LABEL_TYPE: pseudo_labels
182
+ DATASET_THRESHOLD: 0.25
183
+ GPU:
184
+ desc: null
185
+ value: 0
186
+ SEED:
187
+ desc: null
188
+ value: 1
189
+ CLIP_MODEL:
190
+ desc: null
191
+ value:
192
+ NAME: ViT-g-14
193
+ PRETRAINED: laion2b_s34b_b88k
194
+ MODAL:
195
+ desc: null
196
+ value: depth
197
+ PHASE:
198
+ desc: null
199
+ value: train_ctrs
200
+ CKPT:
201
+ desc: null
202
+ value: logs/datt_0216_103917/wandb/latest-run/files/src/best_model.pth
203
+ MIX_INPUT:
204
+ desc: null
205
+ value:
206
+ ENABLE: true
207
+ NUM_MIX: 2
208
+ WEIGHTED: false
209
+ ATTENTION:
210
+ desc: null
211
+ value:
212
+ ENABLE: false
213
+ WEIGHTED_SAMPLE:
214
+ desc: null
215
+ value:
216
+ ENABLE: false
217
+ cmd:
218
+ desc: null
219
+ value: run.py --phase=train_ctrs --config=configs/eurosat/datt_mix_ctrs.yaml --quant_config=quantization_configs/d2_jacob.yaml
220
+ _wandb:
221
+ desc: null
222
+ value:
223
+ code_path: code/run.py
224
+ python_version: 3.10.13
225
+ cli_version: 0.16.3
226
+ framework: huggingface
227
+ huggingface_version: 4.37.2
228
+ is_jupyter_run: false
229
+ is_kaggle_kernel: false
230
+ start_time: 1708267535.486106
231
+ t:
232
+ 1:
233
+ - 1
234
+ - 5
235
+ - 11
236
+ - 41
237
+ - 49
238
+ - 53
239
+ - 55
240
+ - 63
241
+ - 80
242
+ 2:
243
+ - 1
244
+ - 5
245
+ - 11
246
+ - 41
247
+ - 49
248
+ - 53
249
+ - 55
250
+ - 63
251
+ - 80
252
+ 3:
253
+ - 3
254
+ - 13
255
+ - 16
256
+ - 23
257
+ 4: 3.10.13
258
+ 5: 0.16.3
259
+ 6: 4.37.2
260
+ 8:
261
+ - 5
262
+ 13: linux-x86_64
datt_eurosat/wandb/latest-run/files/src/best_model.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4eeccf2981a37d8d7bd0b37ba51bd4b2af553772ba3fb57313c6e118dff5229e
3
+ size 98227739
datt_eurosat/wandb/latest-run/files/src/datt_mix_ctrs.yaml ADDED
@@ -0,0 +1,99 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ CONFIG: datt_mix_ctrs.yaml
2
+ MODEL:
3
+ TYPE: dat
4
+ NAME: dat_plus_plus
5
+ PRETRAINED: "pretrained_weights/dat_pp_tiny_in1k_224.pth"
6
+ DAT:
7
+ img_size: 224
8
+ patch_size: 4
9
+ num_classes: 1000
10
+ expansion: 4
11
+ dim_stem: 64
12
+ dims: [64, 128, 256, 512]
13
+ depths: [2, 4, 18, 2]
14
+ stage_spec: [[N, D], [N, D, N, D], [N, D, N, D, N, D, N, D, N, D, N, D, N, D, N, D, N, D], [D, D]]
15
+ heads: [2, 4, 8, 16]
16
+ window_sizes: [7, 7, 7, 7]
17
+ groups: [1, 2, 4, 8]
18
+ use_pes: [True, True, True, True]
19
+ dwc_pes: [False, False, False, False]
20
+ strides: [8, 4, 2, 1]
21
+ offset_range_factor: [-1, -1, -1, -1]
22
+ no_offs: [False, False, False, False]
23
+ fixed_pes: [False, False, False, False]
24
+ use_dwc_mlps: [True, True, True, True]
25
+ use_lpus: [True, True, True, True]
26
+ use_conv_patches: True
27
+ ksizes: [9, 7, 5, 3]
28
+ nat_ksizes: [7, 7, 7, 7]
29
+ drop_rate: 0.0
30
+ attn_drop_rate: 0.0
31
+ drop_path_rate: 0.2
32
+ # quant_bit: 8
33
+ clip_dim: 1024
34
+
35
+
36
+ TRAIN:
37
+ EPOCHS: 120
38
+ WARMUP_EPOCHS: 0
39
+ BASE_LR: 1e-6
40
+ WEIGHT_DECAY: 0.05
41
+ WARMUP_LR: 5e-7
42
+ MIN_LR: 5e-7
43
+ CLIP_GRAD: 5.0
44
+ LR_SCHEDULER:
45
+ NAME: "cosine"
46
+ DECAY_EPOCHS: 30
47
+ DECAY_RATE: 0.1
48
+ OPTIMIZER:
49
+ NAME: "adamw"
50
+ EPS: 1e-8
51
+ BETAS: [0.9, 0.999]
52
+ MOMENTUM: 0.9
53
+ CRETERION:
54
+ NAME: "TripletMarginLoss" # MSE
55
+ TRIPLET_MARGIN: 0.3
56
+ MINING_METHOD:
57
+ POSITIVE: "easy" # easy, hard, random
58
+ NEGATIVE: "random" # easy, hard, random
59
+ TOTAL: "semihard" # all, semihard, hard
60
+ NEG_NUM: 3
61
+ KD:
62
+ ENABLE: False
63
+ WEIGHT: 10
64
+ WEIGHT: 5e-2
65
+
66
+ DATA:
67
+ DATASET: "eurosat"
68
+ ROOT: "dbs"
69
+ BATCH_SIZE: 4
70
+ VAL_BATCH_SIZE: 32
71
+ EMBEDDING_BATCH_SIZE: 32
72
+ DEPTH_TRANSFORM: "rgb"
73
+ IS_SUBSET: True
74
+ LABEL_TYPE: "pseudo_labels" # "gt" or "clip_vitb32"
75
+ DATASET_THRESHOLD: 0.25
76
+
77
+
78
+ GPU: 0
79
+ SEED: 1
80
+ CLIP_MODEL:
81
+ NAME: "ViT-g-14" # "ViT-B/32"
82
+ PRETRAINED: "laion2b_s34b_b88k"
83
+ MODAL: "depth" # "rgb" or "depth"
84
+ PHASE: "train_ctrs" # "train_ctrs" or "test"
85
+ CKPT: "logs/datt_0216_103917/wandb/latest-run/files/src/best_model.pth"
86
+
87
+ # [] Mix Input
88
+ MIX_INPUT:
89
+ ENABLE: True
90
+ NUM_MIX: 2
91
+ WEIGHTED: False
92
+
93
+ # [] Attention
94
+ ATTENTION:
95
+ ENABLE: False
96
+
97
+ # [] Weighted samples
98
+ WEIGHTED_SAMPLE:
99
+ ENABLE: False
swint_eurosat/wandb/latest-run/files/config.yaml ADDED
@@ -0,0 +1,183 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ wandb_version: 1
2
+
3
+ CONFIG:
4
+ desc: null
5
+ value: swint_mix_ctrs.yaml
6
+ FUSED_WINDOW_PROCESS:
7
+ desc: null
8
+ value: false
9
+ MODEL:
10
+ desc: null
11
+ value:
12
+ TYPE: swin
13
+ NAME: swin_tiny_patch4_window7_224
14
+ DROP_PATH_RATE: 0.3
15
+ DROP_RATE: 0.0
16
+ NUM_CLASSES: 1000
17
+ PRETRAINED: pretrained_weights/swin_tiny_patch4_window7_224.pth
18
+ SWIN:
19
+ EMBED_DIM: 96
20
+ DEPTHS:
21
+ - 2
22
+ - 2
23
+ - 18
24
+ - 2
25
+ NUM_HEADS:
26
+ - 3
27
+ - 6
28
+ - 12
29
+ - 24
30
+ WINDOW_SIZE: 7
31
+ PATCH_SIZE: 4
32
+ IN_CHANS: 3
33
+ MLP_RATIO: 4.0
34
+ QK_SCALE: null
35
+ QKV_BIAS: true
36
+ APE: false
37
+ PATCH_NORM: true
38
+ clip_dim: 1024
39
+ TRAIN:
40
+ desc: null
41
+ value:
42
+ EPOCHS: 120
43
+ WARMUP_EPOCHS: 0
44
+ USE_CHECKPOINT: false
45
+ BASE_LR: 1.0e-06
46
+ WEIGHT_DECAY: 0.001
47
+ WARMUP_LR: 5.0e-07
48
+ MIN_LR: 5.0e-07
49
+ CLIP_GRAD: 5.0
50
+ LR_SCHEDULER:
51
+ NAME: cosine
52
+ DECAY_EPOCHS: 30
53
+ DECAY_RATE: 0.1
54
+ MULTISTEPS: []
55
+ WARMUP_PREFIX: true
56
+ OPTIMIZER:
57
+ NAME: adamw
58
+ EPS: 1.0e-08
59
+ BETAS:
60
+ - 0.9
61
+ - 0.999
62
+ MOMENTUM: 0.9
63
+ CRETERION:
64
+ NAME: TripletMarginLoss
65
+ TRIPLET_MARGIN: 0.3
66
+ MINING_METHOD:
67
+ POSITIVE: easy
68
+ NEGATIVE: random
69
+ TOTAL: semihard
70
+ NEG_NUM: 3
71
+ KD:
72
+ ENABLE: false
73
+ WEIGHT: 10
74
+ WEIGHT: 0.05
75
+ DATA:
76
+ desc: null
77
+ value:
78
+ DATASET: eurosat
79
+ IMG_SIZE: 224
80
+ ROOT: dbs
81
+ BATCH_SIZE: 4
82
+ VAL_BATCH_SIZE: 32
83
+ EMBEDDING_BATCH_SIZE: 32
84
+ DEPTH_TRANSFORM: rgb
85
+ LABEL_TYPE: pseudo_labels
86
+ IS_SUBSET: true
87
+ DATASET_THRESHOLD: 0.25
88
+ GPU:
89
+ desc: null
90
+ value: 0
91
+ SEED:
92
+ desc: null
93
+ value: 1
94
+ CLIP_MODEL:
95
+ desc: null
96
+ value:
97
+ NAME: ViT-g-14
98
+ PRETRAINED: laion2b_s34b_b88k
99
+ MODAL:
100
+ desc: null
101
+ value: depth
102
+ PHASE:
103
+ desc: null
104
+ value: train_ctrs
105
+ CKPT:
106
+ desc: null
107
+ value: logs/swint_0215_162527/wandb/latest-run/files/src/best_model.pth
108
+ MIX_INPUT:
109
+ desc: null
110
+ value:
111
+ ENABLE: true
112
+ NUM_MIX: 2
113
+ WEIGHTED: false
114
+ ATTENTION:
115
+ desc: null
116
+ value:
117
+ ENABLE: false
118
+ WEIGHTED_SAMPLE:
119
+ desc: null
120
+ value:
121
+ ENABLE: false
122
+ quantization:
123
+ desc: null
124
+ value:
125
+ method: jacob
126
+ weight:
127
+ num_bits: 8
128
+ axis: per_channel
129
+ calib_method: max
130
+ activation:
131
+ num_bits: 8
132
+ axis: per_tensor
133
+ calib_method: max
134
+ calibration:
135
+ num_batch: 2
136
+ modal: rgbd
137
+ pre_calibration: false
138
+ cmd:
139
+ desc: null
140
+ value: run.py --phase=train_ctrs --config=configs/eurosat/swint_mix_ctrs.yaml --quant_config=quantization_configs/d2_jacob.yaml
141
+ _wandb:
142
+ desc: null
143
+ value:
144
+ code_path: code/run.py
145
+ python_version: 3.10.13
146
+ cli_version: 0.16.3
147
+ framework: huggingface
148
+ huggingface_version: 4.37.2
149
+ is_jupyter_run: false
150
+ is_kaggle_kernel: false
151
+ start_time: 1708267778.770682
152
+ t:
153
+ 1:
154
+ - 1
155
+ - 5
156
+ - 11
157
+ - 41
158
+ - 49
159
+ - 53
160
+ - 55
161
+ - 63
162
+ - 80
163
+ 2:
164
+ - 1
165
+ - 5
166
+ - 11
167
+ - 41
168
+ - 49
169
+ - 53
170
+ - 55
171
+ - 63
172
+ - 80
173
+ 3:
174
+ - 3
175
+ - 13
176
+ - 16
177
+ - 23
178
+ 4: 3.10.13
179
+ 5: 0.16.3
180
+ 6: 4.37.2
181
+ 8:
182
+ - 5
183
+ 13: linux-x86_64
swint_eurosat/wandb/latest-run/files/src/best_model.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:21965d68e262ac3e99f8df5f1367bd2ea22a7b654c5853598e55b9529e790284
3
+ size 200253173
swint_eurosat/wandb/latest-run/files/src/swint_mix_ctrs.yaml ADDED
@@ -0,0 +1,94 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ CONFIG: swint_mix_ctrs.yaml
2
+ FUSED_WINDOW_PROCESS: False
3
+ MODEL:
4
+ TYPE: swin
5
+ NAME: swin_tiny_patch4_window7_224
6
+ DROP_PATH_RATE: 0.3
7
+ DROP_RATE: 0.0
8
+ NUM_CLASSES: 1000
9
+ PRETRAINED: pretrained_weights/swin_tiny_patch4_window7_224.pth
10
+
11
+ SWIN:
12
+ EMBED_DIM: 96
13
+ DEPTHS: [ 2, 2, 18, 2 ]
14
+ NUM_HEADS: [ 3, 6, 12, 24 ]
15
+ WINDOW_SIZE: 7
16
+ PATCH_SIZE: 4
17
+ IN_CHANS: 3
18
+ MLP_RATIO: 4.0
19
+ QK_SCALE:
20
+ QKV_BIAS: True
21
+ APE: False
22
+ PATCH_NORM: True
23
+
24
+ clip_dim: 1024
25
+
26
+
27
+ TRAIN:
28
+ EPOCHS: 120
29
+ WARMUP_EPOCHS: 0
30
+ USE_CHECKPOINT: False
31
+ BASE_LR: 1e-6
32
+ WEIGHT_DECAY: 1e-3
33
+ WARMUP_LR: 5e-7
34
+ MIN_LR: 5e-7
35
+ CLIP_GRAD: 5.0
36
+ LR_SCHEDULER:
37
+ NAME: "cosine"
38
+ DECAY_EPOCHS: 30
39
+ DECAY_RATE: 0.1
40
+ MULTISTEPS: []
41
+ WARMUP_PREFIX: True
42
+ OPTIMIZER:
43
+ NAME: "adamw"
44
+ EPS: 1e-8
45
+ BETAS: [0.9, 0.999]
46
+ MOMENTUM: 0.9
47
+ CRETERION:
48
+ NAME: "TripletMarginLoss" # MSE
49
+ TRIPLET_MARGIN: 0.3
50
+ MINING_METHOD:
51
+ POSITIVE: "easy" # easy, hard, random
52
+ NEGATIVE: "random" # easy, hard, random
53
+ TOTAL: "semihard" # all, semihard, hard
54
+ NEG_NUM: 3
55
+ KD:
56
+ ENABLE: False
57
+ WEIGHT: 10
58
+ WEIGHT: 5e-2
59
+
60
+ DATA:
61
+ DATASET: "eurosat"
62
+ IMG_SIZE: 224
63
+ ROOT: "dbs"
64
+ BATCH_SIZE: 4
65
+ VAL_BATCH_SIZE: 32
66
+ EMBEDDING_BATCH_SIZE: 32
67
+ DEPTH_TRANSFORM: "rgb"
68
+ LABEL_TYPE: "pseudo_labels" # "gt" or "clip_vitb32"
69
+ IS_SUBSET: True
70
+ DATASET_THRESHOLD: 0.25
71
+
72
+ GPU: 0
73
+ SEED: 1
74
+ CLIP_MODEL:
75
+ NAME: "ViT-g-14" # "ViT-B/32"
76
+ PRETRAINED: "laion2b_s34b_b88k"
77
+ MODAL: "depth" # "rgb" or "depth"
78
+ PHASE: "train_ctrs" # "train_ctrs" or "test"
79
+ CKPT: "logs/swint_0215_162527/wandb/latest-run/files/src/best_model.pth"
80
+
81
+ # [] Mix Input
82
+ MIX_INPUT:
83
+ ENABLE: True
84
+ NUM_MIX: 2
85
+ WEIGHTED: False
86
+
87
+ # [] Attention
88
+ ATTENTION:
89
+ ENABLE: False
90
+
91
+ # [] Weighted samples
92
+ WEIGHTED_SAMPLE:
93
+ ENABLE: False
94
+
swint_scannet/wandb/latest-run/files/config.yaml ADDED
@@ -0,0 +1,183 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ wandb_version: 1
2
+
3
+ CONFIG:
4
+ desc: null
5
+ value: swint_mix_ctrs.yaml
6
+ FUSED_WINDOW_PROCESS:
7
+ desc: null
8
+ value: false
9
+ MODEL:
10
+ desc: null
11
+ value:
12
+ TYPE: swin
13
+ NAME: swin_tiny_patch4_window7_224
14
+ DROP_PATH_RATE: 0.3
15
+ DROP_RATE: 0.0
16
+ NUM_CLASSES: 1000
17
+ PRETRAINED: pretrained_weights/swin_tiny_patch4_window7_224.pth
18
+ SWIN:
19
+ EMBED_DIM: 96
20
+ DEPTHS:
21
+ - 2
22
+ - 2
23
+ - 18
24
+ - 2
25
+ NUM_HEADS:
26
+ - 3
27
+ - 6
28
+ - 12
29
+ - 24
30
+ WINDOW_SIZE: 7
31
+ PATCH_SIZE: 4
32
+ IN_CHANS: 3
33
+ MLP_RATIO: 4.0
34
+ QK_SCALE: null
35
+ QKV_BIAS: true
36
+ APE: false
37
+ PATCH_NORM: true
38
+ clip_dim: 1024
39
+ TRAIN:
40
+ desc: null
41
+ value:
42
+ EPOCHS: 120
43
+ WARMUP_EPOCHS: 0
44
+ USE_CHECKPOINT: false
45
+ BASE_LR: 1.0e-06
46
+ WEIGHT_DECAY: 0.001
47
+ WARMUP_LR: 5.0e-07
48
+ MIN_LR: 5.0e-07
49
+ CLIP_GRAD: 5.0
50
+ LR_SCHEDULER:
51
+ NAME: cosine
52
+ DECAY_EPOCHS: 30
53
+ DECAY_RATE: 0.1
54
+ MULTISTEPS: []
55
+ WARMUP_PREFIX: true
56
+ OPTIMIZER:
57
+ NAME: adamw
58
+ EPS: 1.0e-08
59
+ BETAS:
60
+ - 0.9
61
+ - 0.999
62
+ MOMENTUM: 0.9
63
+ CRETERION:
64
+ NAME: TripletMarginLoss
65
+ TRIPLET_MARGIN: 0.3
66
+ MINING_METHOD:
67
+ POSITIVE: easy
68
+ NEGATIVE: random
69
+ TOTAL: semihard
70
+ NEG_NUM: 3
71
+ KD:
72
+ ENABLE: false
73
+ WEIGHT: 10
74
+ WEIGHT: 0.05
75
+ DATA:
76
+ desc: null
77
+ value:
78
+ DATASET: scannet
79
+ IMG_SIZE: 224
80
+ ROOT: dbs
81
+ BATCH_SIZE: 4
82
+ VAL_BATCH_SIZE: 32
83
+ EMBEDDING_BATCH_SIZE: 32
84
+ DEPTH_TRANSFORM: rgb
85
+ LABEL_TYPE: pseudo_labels
86
+ IS_SUBSET: true
87
+ DATASET_THRESHOLD: 0.25
88
+ GPU:
89
+ desc: null
90
+ value: 0
91
+ SEED:
92
+ desc: null
93
+ value: 1
94
+ CLIP_MODEL:
95
+ desc: null
96
+ value:
97
+ NAME: ViT-g-14
98
+ PRETRAINED: laion2b_s34b_b88k
99
+ MODAL:
100
+ desc: null
101
+ value: depth
102
+ PHASE:
103
+ desc: null
104
+ value: train_ctrs
105
+ CKPT:
106
+ desc: null
107
+ value: logs/swint_0215_131156/wandb/latest-run/files/src/best_model.pth
108
+ MIX_INPUT:
109
+ desc: null
110
+ value:
111
+ ENABLE: true
112
+ NUM_MIX: 2
113
+ WEIGHTED: false
114
+ ATTENTION:
115
+ desc: null
116
+ value:
117
+ ENABLE: false
118
+ WEIGHTED_SAMPLE:
119
+ desc: null
120
+ value:
121
+ ENABLE: false
122
+ quantization:
123
+ desc: null
124
+ value:
125
+ method: jacob
126
+ weight:
127
+ num_bits: 8
128
+ axis: per_channel
129
+ calib_method: max
130
+ activation:
131
+ num_bits: 8
132
+ axis: per_tensor
133
+ calib_method: max
134
+ calibration:
135
+ num_batch: 2
136
+ modal: rgbd
137
+ pre_calibration: false
138
+ cmd:
139
+ desc: null
140
+ value: run.py --phase=train_ctrs --config=configs/scannet/swint_mix_ctrs.yaml --quant_config=quantization_configs/d2_jacob.yaml
141
+ _wandb:
142
+ desc: null
143
+ value:
144
+ code_path: code/run.py
145
+ python_version: 3.10.13
146
+ cli_version: 0.16.3
147
+ framework: huggingface
148
+ huggingface_version: 4.37.2
149
+ is_jupyter_run: false
150
+ is_kaggle_kernel: false
151
+ start_time: 1708267055.144142
152
+ t:
153
+ 1:
154
+ - 1
155
+ - 5
156
+ - 11
157
+ - 41
158
+ - 49
159
+ - 53
160
+ - 55
161
+ - 63
162
+ - 80
163
+ 2:
164
+ - 1
165
+ - 5
166
+ - 11
167
+ - 41
168
+ - 49
169
+ - 53
170
+ - 55
171
+ - 63
172
+ - 80
173
+ 3:
174
+ - 3
175
+ - 13
176
+ - 16
177
+ - 23
178
+ 4: 3.10.13
179
+ 5: 0.16.3
180
+ 6: 4.37.2
181
+ 8:
182
+ - 5
183
+ 13: linux-x86_64
swint_scannet/wandb/latest-run/files/src/best_model.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f7653097d1ef33034928281bdeab5a5a17f0842757e51775be73b30dc05812b2
3
+ size 200253173
swint_scannet/wandb/latest-run/files/src/swint_mix_ctrs.yaml ADDED
@@ -0,0 +1,95 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ CONFIG: swint_mix_ctrs.yaml
2
+ FUSED_WINDOW_PROCESS: False
3
+ MODEL:
4
+ TYPE: swin
5
+ NAME: swin_tiny_patch4_window7_224
6
+ DROP_PATH_RATE: 0.3
7
+ DROP_RATE: 0.0
8
+ NUM_CLASSES: 1000
9
+ PRETRAINED: pretrained_weights/swin_tiny_patch4_window7_224.pth
10
+
11
+ SWIN:
12
+ EMBED_DIM: 96
13
+ DEPTHS: [ 2, 2, 18, 2 ]
14
+ NUM_HEADS: [ 3, 6, 12, 24 ]
15
+ WINDOW_SIZE: 7
16
+ PATCH_SIZE: 4
17
+ IN_CHANS: 3
18
+ MLP_RATIO: 4.0
19
+ QK_SCALE:
20
+ QKV_BIAS: True
21
+ APE: False
22
+ PATCH_NORM: True
23
+
24
+ clip_dim: 1024
25
+
26
+
27
+ TRAIN:
28
+ EPOCHS: 120
29
+ WARMUP_EPOCHS: 0
30
+ USE_CHECKPOINT: False
31
+ BASE_LR: 1e-6
32
+ WEIGHT_DECAY: 1e-3
33
+ WARMUP_LR: 5e-7
34
+ MIN_LR: 5e-7
35
+ CLIP_GRAD: 5.0
36
+ LR_SCHEDULER:
37
+ NAME: "cosine"
38
+ DECAY_EPOCHS: 30
39
+ DECAY_RATE: 0.1
40
+ MULTISTEPS: []
41
+ WARMUP_PREFIX: True
42
+ OPTIMIZER:
43
+ NAME: "adamw"
44
+ EPS: 1e-8
45
+ BETAS: [0.9, 0.999]
46
+ MOMENTUM: 0.9
47
+ CRETERION:
48
+ NAME: "TripletMarginLoss" # MSE
49
+ TRIPLET_MARGIN: 0.3
50
+ MINING_METHOD:
51
+ POSITIVE: "easy" # easy, hard, random
52
+ NEGATIVE: "random" # easy, hard, random
53
+ TOTAL: "semihard" # all, semihard, hard
54
+ NEG_NUM: 3
55
+ KD:
56
+ ENABLE: False
57
+ WEIGHT: 10
58
+ WEIGHT: 5e-2
59
+
60
+ DATA:
61
+ DATASET: "scannet"
62
+ IMG_SIZE: 224
63
+ ROOT: "dbs"
64
+ BATCH_SIZE: 4
65
+ VAL_BATCH_SIZE: 32
66
+ EMBEDDING_BATCH_SIZE: 32
67
+ DEPTH_TRANSFORM: "rgb"
68
+ LABEL_TYPE: "pseudo_labels" # "gt" or "clip_vitb32"
69
+ IS_SUBSET: True
70
+ DATASET_THRESHOLD: 0.25
71
+
72
+
73
+ GPU: 0
74
+ SEED: 1
75
+ CLIP_MODEL:
76
+ NAME: "ViT-g-14" # "ViT-B/32"
77
+ PRETRAINED: "laion2b_s34b_b88k"
78
+ MODAL: "depth" # "rgb" or "depth"
79
+ PHASE: "train_ctrs" # "train_ctrs" or "test"
80
+ CKPT: "logs/swint_0215_131156/wandb/latest-run/files/src/best_model.pth"
81
+
82
+ # [] Mix Input
83
+ MIX_INPUT:
84
+ ENABLE: True
85
+ NUM_MIX: 2
86
+ WEIGHTED: False
87
+
88
+ # [] Attention
89
+ ATTENTION:
90
+ ENABLE: False
91
+
92
+ # [] Weighted samples
93
+ WEIGHTED_SAMPLE:
94
+ ENABLE: False
95
+