{
  "batch_size": 8,
  "accum_iter": 1,
  "epochs": 40,
  "warmup_epochs": 0.01,
  "lr": 5e-06,
  "min_lr": 5e-06,
  "wd": 0.1,
  "clip_grad": 4.0,
  "init_from": null,
  "data_config": "/path/to/data/config/yaml",
  "data_config_train": "configs/libero_ck_all/his_2_train_object_img_only_ck_5_1a2i_all.yaml",
  "data_config_val_ind": "configs/libero_ck/his_2_val_ind_object_img_only_ck_5_1a2i.yaml",
  "data_config_val_ood": "configs/libero_ck/his_2_val_ood_object_img_only_ck_5_1a2i.yaml",
  "cache_ann_on_disk": true,
  "length_clustering": false,
  "num_workers": 8,
  "pin_mem": true,
  "seed": 0,
  "output_dir": "output_dis_libero_ck_all/libero_ts_object_his2imgonly_lr5e6_bs8_ck_5_1a2i_w004_all",
  "save_interval": 1,
  "save_iteration_interval": 5000,
  "only_save_trainable": false,
  "ckpt_max_keep": 0,
  "auto_resume": true,
  "resume_path": null,
  "model_parallel_size": 1,
  "data_parallel": "fsdp",
  "precision": "bf16",
  "grad_precision": "fp32",
  "checkpointing": true,
  "eval_only": false,
  "ft": false,
  "ablation": "0",
  "max_seq_len": 4096,
  "mask_image_logits": false,
  "dropout": 0.05,
  "z_loss_weight": 1e-05,
  "model_size": "7B",
  "world_size": 16,
  "rank": 0,
  "gpu": 0,
  "local_rank": 0,
  "dist_url": "env://",
  "distributed": true,
  "dist_backend": "nccl"
}