Upload root_scripts/launch_8gpu.sh with huggingface_hub
Browse files
root_scripts/launch_8gpu.sh
ADDED
|
@@ -0,0 +1,9 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
#!/bin/bash
# Launch the lora_phyx_math_f SFT run with torchrun on 8 GPUs, sending all
# training output to a timestamped log file.
#
# Exit status:
#   - torchrun's exit status (0 on success), so callers can detect failures
#   - 1 if the training directory or the log directory cannot be set up

TRAIN_DIR="/workspace/rl4phyx/RL4Phyx/SFT"
LOG_DIR="/workspace/rl4phyx/logs"

# The training script is referenced by a relative path below, so a failed cd
# must abort instead of letting torchrun run from the wrong directory.
cd "$TRAIN_DIR" || {
  echo "ERROR: cannot cd to ${TRAIN_DIR}" >&2
  exit 1
}

export CUDA_VISIBLE_DEVICES=0,1,2,3,4,5,6,7
# Unbuffered Python stdout/stderr so output reaches the log file promptly.
export PYTHONUNBUFFERED=1

TIMESTAMP=$(date +%Y%m%d_%H%M%S)
LOG="${LOG_DIR}/train_lora_phyx_math_f_8gpu_${TIMESTAMP}.log"

# Ensure the log directory exists; otherwise every redirect below would fail.
mkdir -p "$LOG_DIR" || {
  echo "ERROR: cannot create log directory ${LOG_DIR}" >&2
  exit 1
}

echo "Starting lora_phyx_math_f (8 GPUs, grad_accum=8, batch=64) at $(date)" > "$LOG"

torchrun --nproc_per_node=8 --master_port=29500 train_sft_phyx_math_lora_freeze.py >> "$LOG" 2>&1
status=$?

# Only write the success marker when training actually succeeded, so anything
# watching the log for TRAINING_COMPLETE is not misled by a crashed run.
if [ "$status" -eq 0 ]; then
  echo "TRAINING_COMPLETE at $(date)" >> "$LOG"
else
  echo "TRAINING_FAILED (exit code ${status}) at $(date)" >> "$LOG"
fi

# Propagate torchrun's status instead of the status of the final echo.
exit "$status"
|