timm
/

Image Classification
timm
PyTorch
Safetensors
rwightman HF staff committed on
Commit
c5bb4cb
1 Parent(s): b574410

Upload train_hparams.yaml with huggingface_hub

Browse files
Files changed (1) hide show
  1. train_hparams.yaml +133 -0
train_hparams.yaml ADDED
@@ -0,0 +1,133 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ aa: rand-m7-inc1-mstd1.0-n3
2
+ amp: true
3
+ amp_dtype: float16
4
+ amp_impl: native
5
+ aug_repeats: 3.0
6
+ aug_splits: 0
7
+ batch_size: 256
8
+ bce_loss: false
9
+ bce_target_thresh: null
10
+ bn_eps: null
11
+ bn_momentum: null
12
+ channels_last: false
13
+ checkpoint_hist: 10
14
+ class_map: ''
15
+ clip_grad: 5.0
16
+ clip_mode: norm
17
+ color_jitter: null
18
+ cooldown_epochs: 10
19
+ crop_pct: 0.95
20
+ cutmix: 1.0
21
+ cutmix_minmax: null
22
+ data: null
23
+ data_dir: /data/imagenet/
24
+ dataset: imagenet
25
+ dataset_download: false
26
+ decay_epochs: 100
27
+ decay_milestones:
28
+ - 90
29
+ - 180
30
+ - 270
31
+ decay_rate: 0.1
32
+ dist_bn: reduce
33
+ drop: 0.0
34
+ drop_block: null
35
+ drop_connect: null
36
+ drop_path: 0.2
37
+ epoch_repeats: 0.0
38
+ epochs: 600
39
+ eval_metric: top1
40
+ experiment: ''
41
+ fast_norm: false
42
+ force_cpu: false
43
+ fuser: ''
44
+ gp: null
45
+ grad_accum_steps: 1
46
+ grad_checkpointing: false
47
+ head_init_bias: null
48
+ head_init_scale: null
49
+ hflip: 0.5
50
+ img_size: 256
51
+ in_chans: null
52
+ initial_checkpoint: ''
53
+ input_size: null
54
+ interpolation: ''
55
+ jsd_loss: false
56
+ layer_decay: null
57
+ local_rank: 0
58
+ log_interval: 50
59
+ log_wandb: false
60
+ lr: null
61
+ lr_base: 0.0008
62
+ lr_base_scale: ''
63
+ lr_base_size: 512
64
+ lr_cycle_decay: 0.5
65
+ lr_cycle_limit: 1
66
+ lr_cycle_mul: 1.0
67
+ lr_k_decay: 1.0
68
+ lr_noise: null
69
+ lr_noise_pct: 0.67
70
+ lr_noise_std: 1.0
71
+ mean: null
72
+ min_lr: 5.0e-07
73
+ mixup: 0.8
74
+ mixup_mode: batch
75
+ mixup_off_epoch: 0
76
+ mixup_prob: 1.0
77
+ mixup_switch_prob: 0.5
78
+ model: vit_betwixt_patch16_rope_reg4_gap_256
79
+ model_ema: false
80
+ model_ema_decay: 0.9998
81
+ model_ema_force_cpu: false
82
+ model_kwargs: {}
83
+ momentum: 0.9
84
+ no_aug: false
85
+ no_ddp_bb: false
86
+ no_prefetcher: false
87
+ no_resume_opt: false
88
+ num_classes: null
89
+ opt: nadamw
90
+ opt_betas: null
91
+ opt_eps: 1.0e-08
92
+ opt_kwargs: {}
93
+ output: ''
94
+ patience_epochs: 10
95
+ pin_mem: true
96
+ pretrained: false
97
+ ratio:
98
+ - 0.75
99
+ - 1.3333333333333333
100
+ recount: 1
101
+ recovery_interval: 0
102
+ remode: pixel
103
+ reprob: 0.2
104
+ resplit: false
105
+ resume: ''
106
+ save_images: false
107
+ scale:
108
+ - 0.08
109
+ - 1.0
110
+ sched: cosine
111
+ sched_on_updates: true
112
+ seed: 0
113
+ smoothing: 0.1
114
+ split_bn: false
115
+ start_epoch: null
116
+ std: null
117
+ sync_bn: false
118
+ synchronize_step: false
119
+ torchcompile: inductor
120
+ torchscript: false
121
+ train_interpolation: random
122
+ train_split: train
123
+ tta: 0
124
+ use_multi_epochs_loader: false
125
+ val_split: validation
126
+ validation_batch_size: null
127
+ vflip: 0.0
128
+ warmup_epochs: 20
129
+ warmup_lr: 5.0e-07
130
+ warmup_prefix: false
131
+ weight_decay: 0.08
132
+ worker_seeding: all
133
+ workers: 8