---
# Training run configuration: a flat mapping of hyperparameters and runtime
# settings, one key per line, kept in alphabetical key order.
# NOTE(review): the key set looks like a dump of a training script's
# command-line arguments -- confirm against the consuming script before
# adding, renaming, or removing keys.

arch: vit_small
backend: nccl
batch_size_per_gpu: 100
clip_grad: 0.0
# Placeholder path -- replace with the real dataset location before use.
data_path: /path/to/imagenet/
dist_url: env://
drop_path_rate: 0.1
epochs: 100
eval_every: 30
freeze_last_layer: 1
# Explicit null: no value is set here. How the consumer treats a missing
# gamma is not visible in this file -- TODO confirm.
gamma: null
# Two-element list; presumably a (min, max) scale range -- verify against
# the consumer.
global_crops_scale:
  - 0.25
  - 1.0
local_crops_number: 6
# Two-element list; presumably a (min, max) scale range -- verify against
# the consumer.
local_crops_scale:
  - 0.05
  - 0.25
local_rank: 0
lr: 0.0005
min_lr: 1.0e-05
mode: simpool
momentum_teacher: 0.996
# List of integers; presumably the k values used for k-NN evaluation --
# verify against the consumer.
nb_knn:
  - 10
  - 20
  - 100
  - 200
norm_last_layer: false
num_workers: 10
optimizer: adamw
out_dim: 65536
# Placeholder path -- replace with the real output directory before use.
output_dir: /path/to/output/
patch_size: 16
saveckp_freq: 20
seed: 0
subset: -1
teacher_temp: 0.07
temperature: 0.07
use_bn_in_head: false
use_fp16: false
warmup_epochs: 10
warmup_teacher_temp: 0.04
warmup_teacher_temp_epochs: 30
weight_decay: 0.04
weight_decay_end: 0.4