timm
/

Image Classification
timm
PyTorch
Safetensors
rwightman HF staff committed on
Commit
7f00ccb
1 Parent(s): 84a41ee

Upload train_hparams.yaml with huggingface_hub

Browse files
Files changed (1) hide show
  1. train_hparams.yaml +148 -0
train_hparams.yaml ADDED
@@ -0,0 +1,148 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ aa: rand-m7-inc1-mstd1.0-n3
2
+ amp: true
3
+ amp_dtype: float16
4
+ amp_impl: native
5
+ aug_repeats: 0.0
6
+ aug_splits: 0
7
+ batch_size: 256
8
+ bce_loss: false
9
+ bce_pos_weight: null
10
+ bce_sum: false
11
+ bce_target_thresh: null
12
+ bn_eps: null
13
+ bn_momentum: null
14
+ channels_last: false
15
+ checkpoint_hist: 10
16
+ class_map: ''
17
+ clip_grad: 5.0
18
+ clip_mode: norm
19
+ color_jitter: null
20
+ color_jitter_prob: null
21
+ cooldown_epochs: 10
22
+ crop_pct: 0.95
23
+ cutmix: 0.8
24
+ cutmix_minmax: null
25
+ data: null
26
+ data_dir: /data/imagenet/
27
+ dataset: imagenet
28
+ dataset_download: false
29
+ decay_epochs: 100
30
+ decay_milestones:
31
+ - 90
32
+ - 180
33
+ - 270
34
+ decay_rate: 0.1
35
+ device: cuda
36
+ device_modules: null
37
+ dist_bn: reduce
38
+ drop: 0.0
39
+ drop_block: null
40
+ drop_connect: null
41
+ drop_path: 0.2
42
+ epoch_repeats: 0.0
43
+ epochs: 60
44
+ eval_metric: top1
45
+ experiment: ''
46
+ fast_norm: false
47
+ force_cpu: false
48
+ fuser: ''
49
+ gaussian_blur_prob: null
50
+ gp: null
51
+ grad_accum_steps: 1
52
+ grad_checkpointing: false
53
+ grayscale_prob: null
54
+ head_init_bias: null
55
+ head_init_scale: 0.0
56
+ hflip: 0.5
57
+ img_size: 256
58
+ in_chans: null
59
+ initial_checkpoint: ''
60
+ input_img_mode: null
61
+ input_key: null
62
+ input_size: null
63
+ interpolation: ''
64
+ jsd_loss: false
65
+ layer_decay: 0.75
66
+ local_rank: 0
67
+ log_interval: 50
68
+ log_wandb: false
69
+ lr: 0.0001
70
+ lr_base: 0.0008
71
+ lr_base_scale: ''
72
+ lr_base_size: 512
73
+ lr_cycle_decay: 0.5
74
+ lr_cycle_limit: 1
75
+ lr_cycle_mul: 1.0
76
+ lr_k_decay: 1.0
77
+ lr_noise: null
78
+ lr_noise_pct: 0.67
79
+ lr_noise_std: 1.0
80
+ mean: null
81
+ min_lr: 5.0e-07
82
+ mixup: 0.2
83
+ mixup_mode: batch
84
+ mixup_off_epoch: 0
85
+ mixup_prob: 1.0
86
+ mixup_switch_prob: 0.5
87
+ model: vit_betwixt_patch16_reg4_gap_256
88
+ model_ema: true
89
+ model_ema_decay: 0.999
90
+ model_ema_force_cpu: false
91
+ model_ema_warmup: false
92
+ model_kwargs: {}
93
+ momentum: 0.9
94
+ no_aug: false
95
+ no_ddp_bb: false
96
+ no_prefetcher: false
97
+ no_resume_opt: false
98
+ num_classes: 1000
99
+ opt: adamw
100
+ opt_betas: null
101
+ opt_eps: 1.0e-08
102
+ opt_kwargs: {}
103
+ output: ''
104
+ patience_epochs: 10
105
+ pin_mem: true
106
+ pretrained: true
107
+ pretrained_path: vit_betw-in12k-8.pth
108
+ ratio:
109
+ - 0.75
110
+ - 1.3333333333333333
111
+ recount: 1
112
+ recovery_interval: 0
113
+ remode: pixel
114
+ reprob: 0.2
115
+ resplit: false
116
+ resume: ''
117
+ save_images: false
118
+ scale:
119
+ - 0.08
120
+ - 1.0
121
+ sched: cosine
122
+ sched_on_updates: true
123
+ seed: 0
124
+ smoothing: 0.1
125
+ split_bn: false
126
+ start_epoch: null
127
+ std: null
128
+ sync_bn: false
129
+ synchronize_step: false
130
+ target_key: null
131
+ torchcompile: inductor
132
+ torchscript: false
133
+ train_crop_mode: null
134
+ train_interpolation: random
135
+ train_num_samples: null
136
+ train_split: train
137
+ tta: 0
138
+ use_multi_epochs_loader: false
139
+ val_num_samples: null
140
+ val_split: validation
141
+ validation_batch_size: null
142
+ vflip: 0.0
143
+ warmup_epochs: 20
144
+ warmup_lr: 5.0e-07
145
+ warmup_prefix: false
146
+ weight_decay: 0.01
147
+ worker_seeding: all
148
+ workers: 8