# Launches examples/glen_phase2/train_glen.py on the_vault dataset, starting
# from the checkpoint in $PHASE1_CKPT and writing to
# logs/model_glen_vault/GLEN_P2_base.
#
# Usage: run from the repository root (all paths below are relative) with
# `python` available on PATH.

# Values forwarded to --gpu_memory_threshold / --gpu_check_interval.
# NOTE(review): presumably a fraction of GPU memory and a number of training
# steps respectively -- confirm against train_glen.py.
$GPU_MEMORY_THRESHOLD = 0.85
$GPU_CHECK_INTERVAL = 50

# Checkpoint directory passed as --model_name_or_path.
$PHASE1_CKPT = "logs/model_glen_vault/GLEN_P1_base"

# Expose only CUDA device 0 to the training process.
$env:CUDA_VISIBLE_DEVICES = "0"

# Arguments are collected in an array and splatted onto the command instead of
# using backtick line continuations: a backtick only continues a line when it
# is the very last character, so any trailing character or blank line silently
# truncates the command.
$trainArgs = @(
    'examples/glen_phase2/train_glen.py'
    '--output_dir', 'logs/model_glen_vault/GLEN_P2_base'
    '--model_name_or_path', $PHASE1_CKPT
    '--load_best_model_at_end', 'True'
    '--per_device_train_batch_size', '4'
    '--per_device_eval_batch_size', '2'
    '--gradient_accumulation_steps', '32'
    '--dropout_rate', '0.1'
    '--warmup_ratio', '0.1'
    '--id_class', 't5_bm25_truncate_3'
    '--dataset_name', 'the_vault'
    '--test100', '1'
    '--tree', '1'
    '--q_max_len', '32'
    '--p_max_len', '256'
    '--negative_passage_type', 'self'
    '--positive_passage_no_shuffle', 'True'
    '--tie_word_embeddings', 'True'
    '--num_return_sequences', '10'
    '--logging_steps', '100'
    '--overwrite_output_dir'
    '--wandb_tag', 'glen_vault_p2'
    '--do_eval'
    '--seed', '42'
    '--gpu_memory_threshold', $GPU_MEMORY_THRESHOLD
    '--gpu_check_interval', $GPU_CHECK_INTERVAL
    '--fp16', 'True'
    '--gradient_checkpointing', 'True'
)

python @trainArgs

# Surface a failed training run to the caller instead of ending silently.
if ($LASTEXITCODE -ne 0) {
    throw "train_glen.py failed (exit code: $LASTEXITCODE)"
}