#!/usr/bin/env bash
#
# Evaluate a series of training checkpoints on two validation splits:
# "in" (valid_in.json) and "ood" (valid_ood.json).
#
# For every checkpoint step and every split, the script:
#   1. launches simple_valid.py through torchrun (4 processes per node),
#      pointing it at the checkpoint, the split's data file and the split's
#      predictions directory;
#   2. runs get_valid_score.py on
#      <predictions dir>/predictions_checkpoint-<step>.json and writes the
#      result to valid_score_<split>_<step>.json in the evaluation directory.
#
# NOTE(review): the predictions file name is presumably what simple_valid.py
# writes into --out_path; confirm against that script.
#
# simple_valid.py and get_valid_score.py are referenced by relative path, so
# the script must be started from the directory that contains them.

# Abort on the first failing command, on unset variables, and on failures
# inside pipelines, so a broken checkpoint run is not silently scored.
set -euo pipefail

readonly WORK_ROOT="/pfs/lichenyi/work"
readonly EVAL_DIR="${WORK_ROOT}/evaluation"
readonly CKPT_ROOT="${WORK_ROOT}/train_ddp"
readonly NPROC_PER_NODE=4
readonly -a CHECKPOINT_STEPS=(100 200 300 400 500 600 700 748)
readonly -a SPLITS=(in ood)

# Make sure the per-split prediction directories exist before any run starts.
for split in "${SPLITS[@]}"; do
  mkdir -p "${EVAL_DIR}/predictions_${split}"
done

for i in "${CHECKPOINT_STEPS[@]}"; do
  printf '%s\n' "======= Running checkpoint-$i ======="

  model_path="${CKPT_ROOT}/checkpoint-$i"

  # Same generate-then-score pipeline for each split; only the data file,
  # the predictions directory and the score file name differ.
  for split in "${SPLITS[@]}"; do
    data_path="${EVAL_DIR}/valid_${split}.json"
    pred_dir="${EVAL_DIR}/predictions_${split}"

    torchrun --nproc_per_node "${NPROC_PER_NODE}" simple_valid.py \
      --model_path "${model_path}" \
      --data_path "${data_path}" \
      --out_path "${pred_dir}" \
      --dtype bf16 \
      --use_system \
      --temperature 0.0

    python get_valid_score.py \
      --pred_path "${pred_dir}/predictions_checkpoint-${i}.json" \
      --out_path "${EVAL_DIR}/valid_score_${split}_${i}.json"
  done
done