|
accum_freq: 1 |
|
aug_cfg: {} |
|
batch_size: 938 |
|
beta1: 0.9 |
|
beta2: 0.98 |
|
checkpoint_path: /tmp/cumulative_sequential_2016/datacomp_xlarge-basic-2023-09-12_05-47-41_cumulative_seq_2016/checkpoints |
|
coca_caption_loss_weight: 2.0 |
|
coca_contrastive_loss_weight: 1.0 |
|
copy_codebase: False |
|
csv_caption_key: title |
|
csv_img_key: filepath |
|
csv_separator: |
|
dataset_resampled: True |
|
dataset_type: webdataset |
|
ddp_static_graph: True |
|
debug: False |
|
decay_fraction: 0.2 |
|
delete_previous_checkpoint: False |
|
device: cuda:0 |
|
dist_backend: nccl |
|
dist_url: env:// |
|
distill: False |
|
distill_model: None |
|
distill_pretrained: None |
|
distributed: True |
|
epochs: 32 |
|
epochs_cooldown: None |
|
eps: 1e-06 |
|
force_custom_text: False |
|
force_image_size: None |
|
force_patch_dropout: None |
|
force_qk_norm: False |
|
force_qk_norm_eps: 1e-05 |
|
force_quick_gelu: False |
|
gather_with_grad: True |
|
grad_checkpointing: True |
|
grad_clip_norm: None |
|
horovod: False |
|
image_mean: None |
|
image_std: None |
|
imagenet_v2: None |
|
imagenet_val: ../imagenet_validation |
|
is_iteration_based: True |
|
local_loss: True |
|
local_rank: 0 |
|
lock_image: False |
|
lock_image_freeze_bn_stats: False |
|
lock_image_unlocked_groups: 0 |
|
lock_text: False |
|
lock_text_freeze_layer_norm: False |
|
lock_text_unlocked_layers: 0 |
|
log_every_n_steps: 100 |
|
log_level: 20 |
|
log_local: False |
|
log_path: /tmp/cumulative_sequential_2016/datacomp_xlarge-basic-2023-09-12_05-47-41_cumulative_seq_2016/out.log |
|
logs: /tmp/cumulative_sequential_2016 |
|
lr: 0.001 |
|
lr_cooldown_end: 0.0 |
|
lr_cooldown_power: 1.0 |
|
lr_scheduler: cosine |
|
max_iterations: 20500 |
|
model: ViT-B-16 |
|
name: datacomp_xlarge-basic-2023-09-12_05-47-41_cumulative_seq_2016 |
|
no_set_device_rank: False |
|
precision: amp |
|
pretrained: |
|
pretrained_image: False |
|
rank: 0 |
|
remote_sync: xlarge_CL_basic_filter/cumulative_sequential_2016/ |
|
remote_sync_frequency: 300 |
|
remote_sync_protocol: s3 |
|
report_to: wandb |
|
resume: xlarge_CL_basic_filter/cumulative_sequential_2016/datacomp_xlarge-basic-2023-09-11_12-08-12_cumulative_seq_2016/checkpoints/epoch_4.pt |
|
save_frequency: 1 |
|
save_most_recent: True |
|
seed: 0 |
|
skip_scheduler: False |
|
tensorboard: False |
|
tensorboard_path: |
|
torchcompile: False |
|
torchscript: False |
|
trace: False |
|
train_data: xlarge_basic_filter/2016/1/{00000000..00000255}.tar::xlarge_basic_filter/2016/10/{00000000..00000255}.tar::xlarge_basic_filter/2016/11/{00000000..00000255}.tar::xlarge_basic_filter/2016/12/{00000000..00000239}.tar::xlarge_basic_filter/2016/13/{00000000..00000239}.tar::xlarge_basic_filter/2016/14/{00000000..00000255}.tar::xlarge_basic_filter/2016/15/{00000000..00000239}.tar::xlarge_basic_filter/2016/16/{00000000..00000255}.tar::xlarge_basic_filter/2016/17/{00000000..00000255}.tar::xlarge_basic_filter/2016/18/{00000000..00000239}.tar::xlarge_basic_filter/2016/19/{00000000..00000239}.tar::xlarge_basic_filter/2016/2/{00000000..00000255}.tar::xlarge_basic_filter/2016/20/{00000000..00000239}.tar::xlarge_basic_filter/2016/21/{00000000..00000238}.tar::xlarge_basic_filter/2016/22/{00000000..00000251}.tar::xlarge_basic_filter/2016/23/{00000000..00000255}.tar::xlarge_basic_filter/2016/24/{00000000..00000191}.tar::xlarge_basic_filter/2016/25/{00000000..00000191}.tar::xlarge_basic_filter/2016/26/{00000000..00000039}.tar::xlarge_basic_filter/2016/27/{00000000..00000073}.tar::xlarge_basic_filter/2016/28/{00000000..00000279}.tar::xlarge_basic_filter/2016/29/{00000000..00000319}.tar::xlarge_basic_filter/2016/3/{00000000..00000255}.tar::xlarge_basic_filter/2016/30/{00000000..00000276}.tar::xlarge_basic_filter/2016/31/{00000000..00000279}.tar::xlarge_basic_filter/2016/32/{00000000..00000317}.tar::xlarge_basic_filter/2016/33/{00000000..00000317}.tar::xlarge_basic_filter/2016/34/{00000000..00000279}.tar::xlarge_basic_filter/2016/35/{00000000..00000255}.tar::xlarge_basic_filter/2016/36/{00000000..00000319}.tar::xlarge_basic_filter/2016/37/{00000000..00000279}.tar::xlarge_basic_filter/2016/38/{00000000..00000239}.tar::xlarge_basic_filter/2016/39/{00000000..00000255}.tar::xlarge_basic_filter/2016/4/{00000000..00000255}.tar::xlarge_basic_filter/2016/40/{00000000..00000255}.tar::xlarge_basic_filter/2016/41/{00000000..00000210}.tar::xlarge_basic_filter/2016/42/{00000000..00000255}.tar::xlarge_basic_filter/2016/43/{00000000..00000255}.tar::xlarge_basic_filter/2016/44/{00000000..00000279}.tar::xlarge_basic_filter/2016/45/{00000000..00000255}.tar::xlarge_basic_filter/2016/46/{00000000..00000255}.tar::xlarge_basic_filter/2016/47/{00000000..00000269}.tar::xlarge_basic_filter/2016/48/{00000000..00000319}.tar::xlarge_basic_filter/2016/49/{00000000..00000319}.tar::xlarge_basic_filter/2016/5/{00000000..00000255}.tar::xlarge_basic_filter/2016/50/{00000000..00000317}.tar::xlarge_basic_filter/2016/51/{00000000..00000319}.tar::xlarge_basic_filter/2016/52/{00000000..00000319}.tar::xlarge_basic_filter/2016/53/{00000000..00000439}.tar::xlarge_basic_filter/2016/54/{00000000..00000447}.tar::xlarge_basic_filter/2016/55/{00000000..00000187}.tar::xlarge_basic_filter/2016/56/{00000000..00000181}.tar::xlarge_basic_filter/2016/57/{00000000..00000137}.tar::xlarge_basic_filter/2016/58/{00000000..00000127}.tar::xlarge_basic_filter/2016/59/{00000000..00000127}.tar::xlarge_basic_filter/2016/6/{00000000..00000255}.tar::xlarge_basic_filter/2016/7/{00000000..00000279}.tar::xlarge_basic_filter/2016/8/{00000000..00000239}.tar::xlarge_basic_filter/2016/9/{00000000..00000255}.tar::xlarge_basic_filter/2015/0/{00000000..00000127}.tar::xlarge_basic_filter/2015/1/{00000000..00000127}.tar::xlarge_basic_filter/2015/10/{00000000..00000127}.tar::xlarge_basic_filter/2015/11/{00000000..00000127}.tar::xlarge_basic_filter/2015/12/{00000000..00000127}.tar::xlarge_basic_filter/2015/13/{00000000..00000127}.tar::xlarge_basic_filter/2015/14/{00000000..00000127}.tar::xlarge_basic_filter/2015/15/{00000000..00000127}.tar::xlarge_basic_filter/2015/16/{00000000..00000127}.tar::xlarge_basic_filter/2015/17/{00000000..00000127}.tar::xlarge_basic_filter/2015/18/{00000000..00000127}.tar::xlarge_basic_filter/2015/19/{00000000..00000127}.tar::xlarge_basic_filter/2015/2/{00000000..00000127}.tar::xlarge_basic_filter/2015/20/{00000000..00000127}.tar::xlarge_basic_filter/2015/21/{00000000..00000079}.tar::xlarge_basic_filter/2015/22/{00000000..00000079}.tar::xlarge_basic_filter/2015/23/{00000000..00000119}.tar::xlarge_basic_filter/2015/24/{00000000..00000079}.tar::xlarge_basic_filter/2015/25/{00000000..00000079}.tar::xlarge_basic_filter/2015/26/{00000000..00000063}.tar::xlarge_basic_filter/2015/27/{00000000..00000063}.tar::xlarge_basic_filter/2015/28/{00000000..00000127}.tar::xlarge_basic_filter/2015/29/{00000000..00000127}.tar::xlarge_basic_filter/2015/3/{00000000..00000127}.tar::xlarge_basic_filter/2015/30/{00000000..00000127}.tar::xlarge_basic_filter/2015/31/{00000000..00000127}.tar::xlarge_basic_filter/2015/32/{00000000..00000127}.tar::xlarge_basic_filter/2015/33/{00000000..00000119}.tar::xlarge_basic_filter/2015/34/{00000000..00000119}.tar::xlarge_basic_filter/2015/35/{00000000..00000127}.tar::xlarge_basic_filter/2015/36/{00000000..00000127}.tar::xlarge_basic_filter/2015/37/{00000000..00000119}.tar::xlarge_basic_filter/2015/38/{00000000..00000127}.tar::xlarge_basic_filter/2015/39/{00000000..00000127}.tar::xlarge_basic_filter/2015/4/{00000000..00000127}.tar::xlarge_basic_filter/2015/40/{00000000..00000119}.tar::xlarge_basic_filter/2015/41/{00000000..00000079}.tar::xlarge_basic_filter/2015/42/{00000000..00000119}.tar::xlarge_basic_filter/2015/43/{00000000..00000119}.tar::xlarge_basic_filter/2015/44/{00000000..00000127}.tar::xlarge_basic_filter/2015/45/{00000000..00000127}.tar::xlarge_basic_filter/2015/46/{00000000..00000127}.tar::xlarge_basic_filter/2015/47/{00000000..00000127}.tar::xlarge_basic_filter/2015/48/{00000000..00000127}.tar::xlarge_basic_filter/2015/49/{00000000..00000119}.tar::xlarge_basic_filter/2015/5/{00000000..00000127}.tar::xlarge_basic_filter/2015/50/{00000000..00000127}.tar::xlarge_basic_filter/2015/51/{00000000..00000119}.tar::xlarge_basic_filter/2015/52/{00000000..00000127}.tar::xlarge_basic_filter/2015/53/{00000000..00000199}.tar::xlarge_basic_filter/2015/54/{00000000..00000159}.tar::xlarge_basic_filter/2015/55/{00000000..00000079}.tar::xlarge_basic_filter/2015/56/{00000000..00000063}.tar::xlarge_basic_filter/2015/57/{00000000..00000063}.tar::xlarge_basic_filter/2015/58/{00000000..00000079}.tar::xlarge_basic_filter/2015/59/{00000000..00000063}.tar::xlarge_basic_filter/2015/6/{00000000..00000127}.tar::xlarge_basic_filter/2015/7/{00000000..00000127}.tar::xlarge_basic_filter/2015/8/{00000000..00000127}.tar::xlarge_basic_filter/2015/9/{00000000..00000127}.tar::xlarge_basic_filter/2014/0/{00000000..00000127}.tar::xlarge_basic_filter/2014/1/{00000000..00000127}.tar::xlarge_basic_filter/2014/10/{00000000..00000098}.tar::xlarge_basic_filter/2014/11/{00000000..00000127}.tar::xlarge_basic_filter/2014/12/{00000000..00000127}.tar::xlarge_basic_filter/2014/13/{00000000..00000127}.tar::xlarge_basic_filter/2014/14/{00000000..00000127}.tar::xlarge_basic_filter/2014/15/{00000000..00000127}.tar::xlarge_basic_filter/2014/16/{00000000..00000105}.tar::xlarge_basic_filter/2014/17/{00000000..00000127}.tar::xlarge_basic_filter/2014/18/{00000000..00000127}.tar::xlarge_basic_filter/2014/19/{00000000..00000127}.tar::xlarge_basic_filter/2014/2/{00000000..00000127}.tar::xlarge_basic_filter/2014/20/{00000000..00000119}.tar::xlarge_basic_filter/2014/21/{00000000..00000127}.tar::xlarge_basic_filter/2014/22/{00000000..00000079}.tar::xlarge_basic_filter/2014/23/{00000000..00000127}.tar::xlarge_basic_filter/2014/24/{00000000..00000063}.tar::xlarge_basic_filter/2014/25/{00000000..00000063}.tar::xlarge_basic_filter/2014/26/{00000000..00000063}.tar::xlarge_basic_filter/2014/27/{00000000..00000063}.tar::xlarge_basic_filter/2014/28/{00000000..00000127}.tar::xlarge_basic_filter/2014/29/{00000000..00000127}.tar::xlarge_basic_filter/2014/3/{00000000..00000127}.tar::xlarge_basic_filter/2014/30/{00000000..00000127}.tar::xlarge_basic_filter/2014/31/{00000000..00000127}.tar::xlarge_basic_filter/2014/32/{00000000..00000127}.tar::xlarge_basic_filter/2014/33/{00000000..00000127}.tar::xlarge_basic_filter/2014/34/{00000000..00000127}.tar::xlarge_basic_filter/2014/35/{00000000..00000127}.tar::xlarge_basic_filter/2014/36/{00000000..00000127}.tar::xlarge_basic_filter/2014/37/{00000000..00000127}.tar::xlarge_basic_filter/2014/38/{00000000..00000127}.tar::xlarge_basic_filter/2014/39/{00000000..00000127}.tar::xlarge_basic_filter/2014/4/{00000000..00000119}.tar::xlarge_basic_filter/2014/40/{00000000..00000127}.tar::xlarge_basic_filter/2014/41/{00000000..00000127}.tar::xlarge_basic_filter/2014/42/{00000000..00000127}.tar::xlarge_basic_filter/2014/43/{00000000..00000127}.tar::xlarge_basic_filter/2014/44/{00000000..00000127}.tar::xlarge_basic_filter/2014/45/{00000000..00000127}.tar::xlarge_basic_filter/2014/46/{00000000..00000127}.tar::xlarge_basic_filter/2014/47/{00000000..00000127}.tar::xlarge_basic_filter/2014/48/{00000000..00000127}.tar::xlarge_basic_filter/2014/49/{00000000..00000127}.tar::xlarge_basic_filter/2014/5/{00000000..00000119}.tar::xlarge_basic_filter/2014/50/{00000000..00000127}.tar::xlarge_basic_filter/2014/51/{00000000..00000127}.tar::xlarge_basic_filter/2014/52/{00000000..00000127}.tar::xlarge_basic_filter/2014/53/{00000000..00000191}.tar::xlarge_basic_filter/2014/54/{00000000..00000191}.tar::xlarge_basic_filter/2014/55/{00000000..00000063}.tar::xlarge_basic_filter/2014/56/{00000000..00000063}.tar::xlarge_basic_filter/2014/57/{00000000..00000063}.tar::xlarge_basic_filter/2014/58/{00000000..00000063}.tar::xlarge_basic_filter/2014/59/{00000000..00000063}.tar::xlarge_basic_filter/2014/6/{00000000..00000127}.tar::xlarge_basic_filter/2014/7/{00000000..00000127}.tar::xlarge_basic_filter/2014/8/{00000000..00000119}.tar::xlarge_basic_filter/2014/9/{00000000..00000117}.tar |
|
train_data_upsampling_factors: None |
|
train_num_samples: None |
|
use_bn_sync: False |
|
use_bnb_linear: None |
|
val_data: None |
|
val_frequency: 1 |
|
val_num_samples: None |
|
wandb: True |
|
wandb_notes: |
|
wandb_project_name: datacomp-xlarge-CL |
|
warmup: 10000 |
|
wd: 0.2 |
|
workers: 4 |
|
world_size: 96 |
|
zeroshot_frequency: 2 |
|
|