ahatamiz commited on
Commit
dca3fec
1 Parent(s): 08e03e6

Create config.json

Browse files
Files changed (1) hide show
  1. config.json +151 -0
config.json ADDED
@@ -0,0 +1,151 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "architectures": [
3
+ "MambaVision"
4
+ ],
5
+ "args": {
6
+ "ThreeAugment": false,
7
+ "aa": "rand-m9-mstd0.5-inc1",
8
+ "activation_tracker": false,
9
+ "amp": true,
10
+ "ampere_sparsity": false,
11
+ "aot_autograd": false,
12
+ "apex_amp": false,
13
+ "attn_drop_rate": 0,
14
+ "aug_repeats": 0,
15
+ "aug_splits": 0,
16
+ "batch_size": 128,
17
+ "bce_loss": false,
18
+ "bce_target_thresh": null,
19
+ "bn_eps": null,
20
+ "bn_momentum": null,
21
+ "channels_last": true,
22
+ "checkpoint_hist": 1,
23
+ "class_map": "",
24
+ "clip_grad": 5,
25
+ "clip_mode": "norm",
26
+ "color_jitter": 0.4,
27
+ "cooldown_epochs": 10,
28
+ "crop_pct": 1,
29
+ "cutmix": 1,
30
+ "cutmix_minmax": null,
31
+ "data_dir": "/datasets/imagenet_lmdb",
32
+ "data_len": 1281167,
33
+ "dataset": "",
34
+ "dataset_download": false,
35
+ "decay_epochs": 100,
36
+ "decay_milestones": [
37
+ 30,
38
+ 60
39
+ ],
40
+ "decay_rate": 0.1,
41
+ "dist_bn": "reduce",
42
+ "drop_block": null,
43
+ "drop_connect": null,
44
+ "drop_path": null,
45
+ "drop_rate": 0,
46
+ "epoch_repeats": 0,
47
+ "epochs": 310,
48
+ "eval_metric": "top1",
49
+ "experiment": "",
50
+ "fuser": "",
51
+ "gp": null,
52
+ "grad_checkpointing": false,
53
+ "hflip": 0.5,
54
+ "img_size": null,
55
+ "initial_checkpoint": "",
56
+ "input_size": [
57
+ 3,
58
+ 224,
59
+ 224
60
+ ],
61
+ "interpolation": "",
62
+ "jsd_loss": false,
63
+ "layer_decay": null,
64
+ "checkpoint": "",
65
+ "local_rank": 0,
66
+ "log_dir": "./log_dir/",
67
+ "log_interval": 50,
68
+ "log_wandb": false,
69
+ "lr": 0.005,
70
+ "lr_cycle_decay": 1,
71
+ "lr_cycle_limit": 1,
72
+ "lr_cycle_mul": 1,
73
+ "lr_ep": false,
74
+ "lr_k_decay": 1,
75
+ "lr_noise": null,
76
+ "lr_noise_pct": 0.67,
77
+ "lr_noise_std": 1,
78
+ "mean": null,
79
+ "mesa": 0.5,
80
+ "mesa_start_ratio": 0.25,
81
+ "min_lr": 0.000005,
82
+ "mixup": 0.8,
83
+ "mixup_mode": "batch",
84
+ "mixup_off_epoch": 0,
85
+ "mixup_prob": 1,
86
+ "mixup_switch_prob": 0.5,
87
+ "model": "mamba_vision_L2",
88
+ "model_ema": true,
89
+ "model_ema_decay": 0.9998,
90
+ "model_ema_force_cpu": false,
91
+ "momentum": 0.9,
92
+ "native_amp": false,
93
+ "no_aug": false,
94
+ "no_ddp_bb": false,
95
+ "no_prefetcher": false,
96
+ "no_resume_opt": false,
97
+ "no_saver": false,
98
+ "num_classes": null,
99
+ "opt": "lamb",
100
+ "opt_betas": [
101
+ 0.9,
102
+ 0.999
103
+ ],
104
+ "opt_eps": 1e-8,
105
+ "output": "",
106
+ "patience_epochs": 10,
107
+ "pin_mem": false,
108
+ "pretrained": false,
109
+ "ratio": [
110
+ 0.75,
111
+ 1.3333333333333333
112
+ ],
113
+ "recount": 1,
114
+ "recovery_interval": 0,
115
+ "remode": "pixel",
116
+ "reprob": 0.25,
117
+ "resplit": false,
118
+ "resume": "",
119
+ "save_images": false,
120
+ "scale": [
121
+ 0.08,
122
+ 1
123
+ ],
124
+ "sched": "cosine",
125
+ "seed": 31,
126
+ "smoothing": 0.1,
127
+ "split_bn": false,
128
+ "start_epoch": null,
129
+ "std": null,
130
+ "sync_bn": false,
131
+ "tag": "mambavision_large2_1k",
132
+ "torchscript": false,
133
+ "train_interpolation": "random",
134
+ "train_split": "train",
135
+ "tta": 0,
136
+ "use_multi_epochs_loader": false,
137
+ "val_split": "validation",
138
+ "validate_only": false,
139
+ "validation_batch_size": null,
140
+ "vflip": 0,
141
+ "warmup_epochs": 20,
142
+ "warmup_lr": 0.000001,
143
+ "weight_decay": 0.05,
144
+ "worker_seeding": "all",
145
+ "workers": 8
146
+ },
147
+ "auto_map": {
148
+ "AutoConfig": "hf_model.MambaVisionConfig",
149
+ "AutoModel": "hf_model.MambaVisionModel"
150
+ }
151
+ }