model:
  arch: mini_gpt4_llama_v2
  model_type: pretrain_vicuna
  freeze_vit: True
  freeze_qformer: True
  max_txt_len: 512
  low_resource: False
  image_size: 224
  end_sym: "</s>"
  llama_model: "mistralai/Mistral-7B-Instruct-v0.2"
  ckpt: "checkpoints/image_mistral_checkpoint.pth"
  use_grad_checkpoint: True
  chat_template: True
  lora_r: 64
  lora_alpha: 16
  length: 50
  use_grad_checkpoint_llm: True
  max_context_len: 7200
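# Note (annotation, not in the original file): lora_r and lora_alpha above
# set the LoRA rank and scaling, presumably for adapters on the language
# model, while use_grad_checkpoint / use_grad_checkpoint_llm enable
# activation checkpointing on the vision encoder and LLM to trade compute
# for memory.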
datasets:
  cmd_video:  # 15938
    batch_size: 1
    vis_processor:
      train:
        name: "blip2_image_train"
        image_size: 224
    text_processor:
      train:
        name: "blip_caption"
    sample_ratio: 100
  webvid:  # 42387
    batch_size: 1
    vis_processor:
      train:
        name: "blip2_image_train"
        image_size: 224
    text_processor:
      train:
        name: "blip_caption"
    sample_ratio: 50
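# Note (annotation, not in the original file): under the common
# BLIP-2/LAVIS convention, sample_ratio weights how batches are mixed
# across datasets, so cmd_video and webvid would be sampled at roughly
# a 100:50 (2:1) ratio during pretraining.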
run:
  task: image_text_pretrain
  # optimizer
  lr_sched: "linear_warmup_cosine_lr"
  init_lr: 1e-4
  min_lr: 8e-5
  warmup_lr: 1e-6
  weight_decay: 0.05
  max_epoch: 50
  num_workers: 16
  warmup_steps: 875
  iters_per_epoch: 875
  seed: 42
  output_dir: "training_output/cmd_webvid_pretrain"
  amp: True
  resume_ckpt_path: null
  evaluate: False
  train_splits: ["train"]
  device: "cuda"
  world_size: 1
  dist_url: "env://"
  distributed: True
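
For reference, a minimal Python sketch of how a config like this is typically consumed and what the schedule works out to. The file path below is hypothetical; only yaml.safe_load from PyYAML and the values in the run section above are assumed:

import yaml  # PyYAML

# Hypothetical path; adjust to wherever this config lives in the repo.
with open("train_configs/cmd_webvid_pretrain.yaml") as f:
    cfg = yaml.safe_load(f)

run = cfg["run"]
# 50 epochs x 875 iters/epoch = 43,750 optimization steps in total;
# warmup_steps (875) covers exactly the first epoch before the cosine
# decay from init_lr (1e-4) down to min_lr (8e-5).
total_steps = run["max_epoch"] * run["iters_per_epoch"]
print(f"total steps: {total_steps}, warmup: {run['warmup_steps']}")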